diff --git "a/profile_trace/iteration_12288/rank6_trace.json" "b/profile_trace/iteration_12288/rank6_trace.json" new file mode 100644--- /dev/null +++ "b/profile_trace/iteration_12288/rank6_trace.json" @@ -0,0 +1,68515 @@ + +{ + "schemaVersion": 1, + "deviceProperties": [ + { + "id": 0, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 1, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 2, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 3, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 4, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 5, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 6, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 7, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + } + ], + "cupti_version": 22, + "cuda_runtime_version": 12040, + "cuda_driver_version": 12080, + "distributedInfo": {"backend": "nccl", "rank": 6, "world_size": 8, "pg_count": 1, "pg_config": [{"pg_name": "0", "pg_desc": "default_pg", "backend_config": "cuda:nccl", "pg_size": 8, "ranks": [0, 1, 2, 3, 4, 5, 6, 7]}], "nccl_version": "2.21.5"}, + "record_shapes": 1, + "trace_id": "8ADBF4A35A1C431BAE48BB005E0E72AB", + "traceEvents": [ + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: DivBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115506875.331, "dur": 126.704, + "args": { + "External id": 229889,"Record function id": 0, "Sequence number": 2757958, "Fwd thread id": 1, "Ev Idx": 0 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "DivBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115506894.122, "dur": 97.224, + "args": { + "External id": 229890,"Sequence number": 2757958, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 1 + } + }, + { + "ph": "f", "id": 1, "pid": 4183442, "tid": 31331, "ts": 667115506894.122, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183442, "tid": 31331, + "ts": 667115506902.371, "dur": 86.806, + "args": { + "External id": 229891,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 2 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115507015.432, "dur": 236.269, + "args": { + "External id": 229892,"Record function id": 0, "Ev Idx": 3 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward", "pid": 4183442, "tid": 31331, + "ts": 667115507079.221, "dur": 100.364, + "args": { + "External id": 229893,"Record function id": 0, "Ev Idx": 4 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.19", "pid": 4183442, "tid": 31331, + "ts": 667115507114.197, "dur": 53.805, + "args": { + "External id": 229894,"Record function id": 0, "Ev Idx": 5 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115507184.529, "dur": 1.620, + "args": { + "External id": 229895,"Sequence number": 2757957, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6 + } + }, + { + "ph": "f", "id": 2, "pid": 4183442, "tid": 31331, "ts": 667115507184.529, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115507190.754, "dur": 55.559, + "args": { + "External id": 229896,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 7 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115507198.716, "dur": 47.071, + "args": { + "External id": 229897,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 8 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115507208.171, "dur": 3.008, + "args": { + "External id": 229898,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115507260.502, "dur": 16781.176, + "args": { + "External id": 229899,"Record function id": 0, "Sequence number": 2757955, "Fwd thread id": 1, "Ev Idx": 10 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115507262.475, "dur": 16768.530, + "args": { + "External id": 229900,"Sequence number": 2757955, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11 + } + }, + { + "ph": "f", "id": 3, "pid": 4183442, "tid": 31331, "ts": 667115507262.475, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115507308.576, "dur": 4.006, + "args": { + "External id": 229901,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 12 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115507317.826, "dur": 16599.414, + "args": { + "External id": 229902,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 13 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115507320.283, "dur": 16596.550, + "args": { + "External id": 229903,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 14 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115507325.113, "dur": 7.092, + "args": { + "External id": 229904,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 15 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115507334.608, "dur": 16581.020, + "args": { + "External id": 229905,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 16 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183442, "tid": 31331, + "ts": 667115523921.997, "dur": 0.478, + "args": { + "External id": 229906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 17 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183442, "tid": 31331, + "ts": 667115523924.917, "dur": 3.358, + "args": { + "External id": 229907,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 18 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183442, "tid": 31331, + "ts": 667115523926.887, "dur": 1.059, + "args": { + "External id": 229908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 19 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 31331, + "ts": 667115523934.068, "dur": 31.684, + "args": { + "External id": 229909,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 20 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 31331, + "ts": 667115523974.768, "dur": 46.337, + "args": { + "External id": 229910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 21 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 31331, + "ts": 667115523976.868, "dur": 44.020, + "args": { + "External id": 229911,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 22 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 31331, + "ts": 667115523978.654, "dur": 41.918, + "args": { + "External id": 229912,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 23 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524053.244, "dur": 20.356, + "args": { + "External id": 229913,"Record function id": 0, "Sequence number": 2757954, "Fwd thread id": 1, "Ev Idx": 24 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524054.902, "dur": 14.395, + "args": { + "External id": 229914,"Sequence number": 2757954, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 25 + } + }, + { + "ph": "f", "id": 4, "pid": 4183442, "tid": 31331, "ts": 667115524054.902, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115524058.740, "dur": 10.313, + "args": { + "External id": 229915,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 26 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115524062.768, "dur": 6.109, + "args": { + "External id": 229916,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 27 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524077.698, "dur": 99.274, + "args": { + "External id": 229917,"Record function id": 0, "Sequence number": 2757953, "Fwd thread id": 1, "Ev Idx": 28 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524078.688, "dur": 88.893, + "args": { + "External id": 229918,"Sequence number": 2757953, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 29 + } + }, + { + "ph": "f", "id": 5, "pid": 4183442, "tid": 31331, "ts": 667115524078.688, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115524082.452, "dur": 84.589, + "args": { + "External id": 229919,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 30 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115524088.738, "dur": 38.442, + "args": { + "External id": 229920,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 31 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115524092.607, "dur": 6.843, + "args": { + "External id": 229921,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 32 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115524101.936, "dur": 24.958, + "args": { + "External id": 229922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 33 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115524105.908, "dur": 20.413, + "args": { + "External id": 229923,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 34 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115524131.781, "dur": 4.253, + "args": { + "External id": 229924,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 35 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524134.174, "dur": 1.546, + "args": { + "External id": 229925,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 36 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115524137.167, "dur": 28.984, + "args": { + "External id": 229926,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 37 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524182.791, "dur": 66.315, + "args": { + "External id": 229927,"Record function id": 0, "Sequence number": 2757952, "Fwd thread id": 1, "Ev Idx": 38 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524183.900, "dur": 59.968, + "args": { + "External id": 229928,"Sequence number": 2757952, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 39 + } + }, + { + "ph": "f", "id": 6, "pid": 4183442, "tid": 31331, "ts": 667115524183.900, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183442, "tid": 31331, + "ts": 667115524187.486, "dur": 56.124, + "args": { + "External id": 229929,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "3"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 40 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115524191.913, "dur": 21.605, + "args": { + "External id": 229930,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 41 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115524192.793, "dur": 3.130, + "args": { + "External id": 229931,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 42 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115524196.511, "dur": 16.735, + "args": { + "External id": 229932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 43 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115524199.444, "dur": 13.409, + "args": { + "External id": 229933,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 44 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115524217.337, "dur": 6.110, + "args": { + "External id": 229934,"Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 45 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524221.585, "dur": 1.126, + "args": { + "External id": 229935,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 46 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115524224.336, "dur": 18.673, + "args": { + "External id": 229936,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 47 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524252.908, "dur": 96.216, + "args": { + "External id": 229937,"Record function id": 0, "Sequence number": 2757951, "Fwd thread id": 1, "Ev Idx": 48 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524253.893, "dur": 90.495, + "args": { + "External id": 229938,"Sequence number": 2757951, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 49 + } + }, + { + "ph": "f", "id": 7, "pid": 4183442, "tid": 31331, "ts": 667115524253.893, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115524256.853, "dur": 87.191, + "args": { + "External id": 229939,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 50 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115524259.837, "dur": 18.481, + "args": { + "External id": 229940,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 51 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115524260.611, "dur": 2.444, + "args": { + "External id": 229941,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 52 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115524263.628, "dur": 14.434, + "args": { + "External id": 229942,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 53 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115524264.447, "dur": 13.268, + "args": { + "External id": 229943,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 54 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115524281.074, "dur": 2.087, + "args": { + "External id": 229944,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 55 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524282.236, "dur": 0.741, + "args": { + "External id": 229945,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 56 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115524283.940, "dur": 59.408, + "args": { + "External id": 229946,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 57 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524353.229, "dur": 66.485, + "args": { + "External id": 229947,"Record function id": 0, "Sequence number": 2757950, "Fwd thread id": 1, "Ev Idx": 58 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524354.102, "dur": 61.765, + "args": { + "External id": 229948,"Sequence number": 2757950, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 59 + } + }, + { + "ph": "f", "id": 8, "pid": 4183442, "tid": 31331, "ts": 667115524354.102, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115524355.331, "dur": 60.271, + "args": { + "External id": 229949,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 60 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115524357.811, "dur": 16.324, + "args": { + "External id": 229950,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 61 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115524358.562, "dur": 3.885, + "args": { + "External id": 229951,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 62 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115524363.049, "dur": 10.849, + "args": { + "External id": 229952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 63 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115524363.996, "dur": 9.573, + "args": { + "External id": 229953,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 64 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115524375.008, "dur": 3.330, + "args": { + "External id": 229954,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 65 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524377.749, "dur": 0.407, + "args": { + "External id": 229955,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 66 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115524380.470, "dur": 34.631, + "args": { + "External id": 229956,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 67 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524423.854, "dur": 38.109, + "args": { + "External id": 229957,"Record function id": 0, "Sequence number": 2757949, "Fwd thread id": 1, "Ev Idx": 68 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115524425.911, "dur": 0.985, + "args": { + "External id": 229958,"Sequence number": 2757949, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 69 + } + }, + { + "ph": "f", "id": 9, "pid": 4183442, "tid": 31331, "ts": 667115524425.911, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115524429.142, "dur": 27.915, + "args": { + "External id": 229959,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 70 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115524431.204, "dur": 25.359, + "args": { + "External id": 229960,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 71 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524437.433, "dur": 2.010, + "args": { + "External id": 229961,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 72 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115524467.004, "dur": 1105.670, + "args": { + "External id": 229962,"Record function id": 0, "Sequence number": 2757947, "Fwd thread id": 1, "Ev Idx": 73 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115524468.418, "dur": 1067.834, + "args": { + "External id": 229963,"Sequence number": 2757947, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 74 + } + }, + { + "ph": "f", "id": 10, "pid": 4183442, "tid": 31331, "ts": 667115524468.418, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115524516.900, "dur": 2.909, + "args": { + "External id": 229964,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 75 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115524522.462, "dur": 914.732, + "args": { + "External id": 229965,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 76 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115524524.220, "dur": 912.739, + "args": { + "External id": 229966,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 77 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115524526.885, "dur": 6.033, + "args": { + "External id": 229967,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 78 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115524534.056, "dur": 901.812, + "args": { + "External id": 229968,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 79 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183442, "tid": 31331, + "ts": 667115525440.360, "dur": 0.361, + "args": { + "External id": 229969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 80 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183442, "tid": 31331, + "ts": 667115525441.921, "dur": 4.103, + "args": { + "External id": 229970,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 81 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183442, "tid": 31331, + "ts": 667115525445.090, "dur": 0.798, + "args": { + "External id": 229971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 82 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 31331, + "ts": 667115525449.728, "dur": 20.906, + "args": { + "External id": 229972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 83 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 31331, + "ts": 667115525476.058, "dur": 52.974, + "args": { + "External id": 229973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 84 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 31331, + "ts": 667115525477.400, "dur": 51.437, + "args": { + "External id": 229974,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 85 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 31331, + "ts": 667115525478.441, "dur": 49.770, + "args": { + "External id": 229975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 86 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115525547.421, "dur": 20.889, + "args": { + "External id": 229976,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 87 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525580.480, "dur": 15.955, + "args": { + "External id": 229977,"Record function id": 0, "Sequence number": 2757946, "Fwd thread id": 1, "Ev Idx": 88 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525581.694, "dur": 11.302, + "args": { + "External id": 229978,"Sequence number": 2757946, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 89 + } + }, + { + "ph": "f", "id": 11, "pid": 4183442, "tid": 31331, "ts": 667115525581.694, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115525585.965, "dur": 6.838, + "args": { + "External id": 229979,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 90 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115525589.124, "dur": 3.536, + "args": { + "External id": 229980,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 91 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525599.712, "dur": 89.771, + "args": { + "External id": 229981,"Record function id": 0, "Sequence number": 2757945, "Fwd thread id": 1, "Ev Idx": 92 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525600.884, "dur": 81.187, + "args": { + "External id": 229982,"Sequence number": 2757945, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 93 + } + }, + { + "ph": "f", "id": 12, "pid": 4183442, "tid": 31331, "ts": 667115525600.884, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115525602.471, "dur": 79.060, + "args": { + "External id": 229983,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 94 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115525606.178, "dur": 20.422, + "args": { + "External id": 229984,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 95 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115525607.499, "dur": 3.143, + "args": { + "External id": 229985,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 96 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115525611.452, "dur": 14.899, + "args": { + "External id": 229986,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 97 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115525612.524, "dur": 13.275, + "args": { + "External id": 229987,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 98 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115525627.867, "dur": 4.249, + "args": { + "External id": 229988,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 99 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115525629.528, "dur": 2.357, + "args": { + "External id": 229989,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115525633.051, "dur": 47.340, + "args": { + "External id": 229990,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525697.869, "dur": 57.972, + "args": { + "External id": 229991,"Record function id": 0, "Sequence number": 2757944, "Fwd thread id": 1, "Ev Idx": 102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525699.086, "dur": 52.573, + "args": { + "External id": 229992,"Sequence number": 2757944, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 103 + } + }, + { + "ph": "f", "id": 13, "pid": 4183442, "tid": 31331, "ts": 667115525699.086, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183442, "tid": 31331, + "ts": 667115525702.433, "dur": 48.884, + "args": { + "External id": 229993,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "2"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115525704.000, "dur": 20.557, + "args": { + "External id": 229994,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115525705.244, "dur": 3.064, + "args": { + "External id": 229995,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115525709.161, "dur": 15.134, + "args": { + "External id": 229996,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115525710.044, "dur": 13.780, + "args": { + "External id": 229997,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115525725.553, "dur": 7.116, + "args": { + "External id": 229998,"Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115525731.039, "dur": 1.078, + "args": { + "External id": 229999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115525733.521, "dur": 17.318, + "args": { + "External id": 230000,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525759.739, "dur": 86.701, + "args": { + "External id": 230001,"Record function id": 0, "Sequence number": 2757943, "Fwd thread id": 1, "Ev Idx": 112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525760.720, "dur": 81.908, + "args": { + "External id": 230002,"Sequence number": 2757943, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 113 + } + }, + { + "ph": "f", "id": 14, "pid": 4183442, "tid": 31331, "ts": 667115525760.720, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115525762.299, "dur": 80.080, + "args": { + "External id": 230003,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115525763.514, "dur": 16.120, + "args": { + "External id": 230004,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115525764.341, "dur": 2.334, + "args": { + "External id": 230005,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115525767.323, "dur": 12.059, + "args": { + "External id": 230006,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115525768.236, "dur": 10.671, + "args": { + "External id": 230007,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115525780.806, "dur": 4.499, + "args": { + "External id": 230008,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115525784.205, "dur": 0.879, + "args": { + "External id": 230009,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115525785.942, "dur": 55.793, + "args": { + "External id": 230010,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525854.094, "dur": 77.675, + "args": { + "External id": 230011,"Record function id": 0, "Sequence number": 2757942, "Fwd thread id": 1, "Ev Idx": 122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525855.250, "dur": 57.084, + "args": { + "External id": 230012,"Sequence number": 2757942, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 123 + } + }, + { + "ph": "f", "id": 15, "pid": 4183442, "tid": 31331, "ts": 667115525855.250, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115525858.541, "dur": 53.561, + "args": { + "External id": 230013,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115525859.462, "dur": 14.087, + "args": { + "External id": 230014,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115525860.339, "dur": 1.942, + "args": { + "External id": 230015,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115525863.230, "dur": 10.079, + "args": { + "External id": 230016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115525863.979, "dur": 8.961, + "args": { + "External id": 230017,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115525874.438, "dur": 1.713, + "args": { + "External id": 230018,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115525875.385, "dur": 0.574, + "args": { + "External id": 230019,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115525876.793, "dur": 34.802, + "args": { + "External id": 230020,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115525915.984, "dur": 14.589, + "args": { + "External id": 230021,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525936.058, "dur": 35.049, + "args": { + "External id": 230022,"Record function id": 0, "Sequence number": 2757941, "Fwd thread id": 1, "Ev Idx": 133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115525939.323, "dur": 1.027, + "args": { + "External id": 230023,"Sequence number": 2757941, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 134 + } + }, + { + "ph": "f", "id": 16, "pid": 4183442, "tid": 31331, "ts": 667115525939.323, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115525942.783, "dur": 24.794, + "args": { + "External id": 230024,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115525944.287, "dur": 22.859, + "args": { + "External id": 230025,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115525949.136, "dur": 2.582, + "args": { + "External id": 230026,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115525976.054, "dur": 1450.782, + "args": { + "External id": 230027,"Record function id": 0, "Sequence number": 2757939, "Fwd thread id": 1, "Ev Idx": 138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115525978.809, "dur": 1422.324, + "args": { + "External id": 230028,"Sequence number": 2757939, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 139 + } + }, + { + "ph": "f", "id": 17, "pid": 4183442, "tid": 31331, "ts": 667115525978.809, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115526006.251, "dur": 2.176, + "args": { + "External id": 230029,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115526010.403, "dur": 1310.133, + "args": { + "External id": 230030,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115526011.721, "dur": 1308.572, + "args": { + "External id": 230031,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115526013.922, "dur": 3.192, + "args": { + "External id": 230032,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115526018.038, "dur": 1301.289, + "args": { + "External id": 230033,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183442, "tid": 31331, + "ts": 667115527323.338, "dur": 0.289, + "args": { + "External id": 230034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183442, "tid": 31331, + "ts": 667115527324.714, "dur": 2.132, + "args": { + "External id": 230035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183442, "tid": 31331, + "ts": 667115527325.846, "dur": 0.871, + "args": { + "External id": 230036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 31331, + "ts": 667115527329.929, "dur": 19.412, + "args": { + "External id": 230037,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 31331, + "ts": 667115527358.163, "dur": 36.258, + "args": { + "External id": 230038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 31331, + "ts": 667115527358.951, "dur": 35.280, + "args": { + "External id": 230039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 31331, + "ts": 667115527360.082, "dur": 33.717, + "args": { + "External id": 230040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115527408.880, "dur": 14.042, + "args": { + "External id": 230041,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527433.765, "dur": 10.821, + "args": { + "External id": 230042,"Record function id": 0, "Sequence number": 2757938, "Fwd thread id": 1, "Ev Idx": 153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527435.239, "dur": 6.115, + "args": { + "External id": 230043,"Sequence number": 2757938, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 154 + } + }, + { + "ph": "f", "id": 18, "pid": 4183442, "tid": 31331, "ts": 667115527435.239, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115527437.369, "dur": 3.803, + "args": { + "External id": 230044,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115527438.428, "dur": 2.620, + "args": { + "External id": 230045,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527447.865, "dur": 75.939, + "args": { + "External id": 230046,"Record function id": 0, "Sequence number": 2757937, "Fwd thread id": 1, "Ev Idx": 157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527449.165, "dur": 67.556, + "args": { + "External id": 230047,"Sequence number": 2757937, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 158 + } + }, + { + "ph": "f", "id": 19, "pid": 4183442, "tid": 31331, "ts": 667115527449.165, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115527452.067, "dur": 64.184, + "args": { + "External id": 230048,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115527456.125, "dur": 18.658, + "args": { + "External id": 230049,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115527457.236, "dur": 2.388, + "args": { + "External id": 230050,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115527460.528, "dur": 14.024, + "args": { + "External id": 230051,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115527461.770, "dur": 12.299, + "args": { + "External id": 230052,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115527476.116, "dur": 3.863, + "args": { + "External id": 230053,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527478.775, "dur": 0.990, + "args": { + "External id": 230054,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115527480.957, "dur": 34.232, + "args": { + "External id": 230055,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527529.636, "dur": 51.035, + "args": { + "External id": 230056,"Record function id": 0, "Sequence number": 2757936, "Fwd thread id": 1, "Ev Idx": 167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527531.024, "dur": 46.200, + "args": { + "External id": 230057,"Sequence number": 2757936, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 168 + } + }, + { + "ph": "f", "id": 20, "pid": 4183442, "tid": 31331, "ts": 667115527531.024, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183442, "tid": 31331, + "ts": 667115527533.084, "dur": 43.902, + "args": { + "External id": 230058,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115527534.567, "dur": 19.529, + "args": { + "External id": 230059,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115527537.400, "dur": 2.504, + "args": { + "External id": 230060,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115527540.713, "dur": 13.143, + "args": { + "External id": 230061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115527541.429, "dur": 12.041, + "args": { + "External id": 230062,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115527555.310, "dur": 7.054, + "args": { + "External id": 230063,"Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527559.313, "dur": 2.509, + "args": { + "External id": 230064,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115527563.137, "dur": 13.430, + "args": { + "External id": 230065,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527584.754, "dur": 101.276, + "args": { + "External id": 230066,"Record function id": 0, "Sequence number": 2757935, "Fwd thread id": 1, "Ev Idx": 177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527585.604, "dur": 95.910, + "args": { + "External id": 230067,"Sequence number": 2757935, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 178 + } + }, + { + "ph": "f", "id": 21, "pid": 4183442, "tid": 31331, "ts": 667115527585.604, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115527586.879, "dur": 94.263, + "args": { + "External id": 230068,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115527587.987, "dur": 20.646, + "args": { + "External id": 230069,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115527590.608, "dur": 1.886, + "args": { + "External id": 230070,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115527593.228, "dur": 15.134, + "args": { + "External id": 230071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115527593.977, "dur": 13.911, + "args": { + "External id": 230072,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115527609.837, "dur": 3.088, + "args": { + "External id": 230073,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527612.112, "dur": 0.596, + "args": { + "External id": 230074,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115527613.753, "dur": 66.121, + "args": { + "External id": 230075,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527692.063, "dur": 89.787, + "args": { + "External id": 230076,"Record function id": 0, "Sequence number": 2757934, "Fwd thread id": 1, "Ev Idx": 187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527693.165, "dur": 68.639, + "args": { + "External id": 230077,"Sequence number": 2757934, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 188 + } + }, + { + "ph": "f", "id": 22, "pid": 4183442, "tid": 31331, "ts": 667115527693.165, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115527696.685, "dur": 64.894, + "args": { + "External id": 230078,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115527697.937, "dur": 20.676, + "args": { + "External id": 230079,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115527700.839, "dur": 2.145, + "args": { + "External id": 230080,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115527703.808, "dur": 14.538, + "args": { + "External id": 230081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115527704.690, "dur": 13.175, + "args": { + "External id": 230082,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115527719.369, "dur": 2.581, + "args": { + "External id": 230083,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527721.156, "dur": 0.582, + "args": { + "External id": 230084,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115527722.522, "dur": 38.491, + "args": { + "External id": 230085,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115527764.896, "dur": 15.623, + "args": { + "External id": 230086,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527785.756, "dur": 32.107, + "args": { + "External id": 230087,"Record function id": 0, "Sequence number": 2757933, "Fwd thread id": 1, "Ev Idx": 198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115527786.772, "dur": 1.231, + "args": { + "External id": 230088,"Sequence number": 2757933, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 199 + } + }, + { + "ph": "f", "id": 23, "pid": 4183442, "tid": 31331, "ts": 667115527786.772, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115527789.791, "dur": 22.210, + "args": { + "External id": 230089,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115527791.226, "dur": 20.405, + "args": { + "External id": 230090,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527795.453, "dur": 0.543, + "args": { + "External id": 230091,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115527821.810, "dur": 1450.113, + "args": { + "External id": 230092,"Record function id": 0, "Sequence number": 2757932, "Fwd thread id": 1, "Ev Idx": 203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115527833.932, "dur": 1408.213, + "args": { + "External id": 230093,"Sequence number": 2757932, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 204 + } + }, + { + "ph": "f", "id": 24, "pid": 4183442, "tid": 31331, "ts": 667115527833.932, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115527859.254, "dur": 1.985, + "args": { + "External id": 230094,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115527863.312, "dur": 1297.671, + "args": { + "External id": 230095,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115527864.421, "dur": 1296.285, + "args": { + "External id": 230096,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115527867.602, "dur": 2.870, + "args": { + "External id": 230097,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115527871.387, "dur": 1288.174, + "args": { + "External id": 230098,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183442, "tid": 31331, + "ts": 667115529163.861, "dur": 0.270, + "args": { + "External id": 230099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183442, "tid": 31331, + "ts": 667115529165.153, "dur": 1.908, + "args": { + "External id": 230100,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183442, "tid": 31331, + "ts": 667115529166.187, "dur": 0.690, + "args": { + "External id": 230101,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 31331, + "ts": 667115529170.032, "dur": 22.101, + "args": { + "External id": 230102,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 31331, + "ts": 667115529196.186, "dur": 39.799, + "args": { + "External id": 230103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 31331, + "ts": 667115529197.090, "dur": 38.700, + "args": { + "External id": 230104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 31331, + "ts": 667115529198.060, "dur": 37.354, + "args": { + "External id": 230105,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115529251.854, "dur": 15.813, + "args": { + "External id": 230106,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115529284.697, "dur": 12.429, + "args": { + "External id": 230107,"Record function id": 0, "Ev Idx": 218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115529287.302, "dur": 8.200, + "args": { + "External id": 230108,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115529290.478, "dur": 3.932, + "args": { + "External id": 230109,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115529291.254, "dur": 3.035, + "args": { + "External id": 230110,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529302.583, "dur": 11.835, + "args": { + "External id": 230111,"Record function id": 0, "Sequence number": 2757931, "Fwd thread id": 1, "Ev Idx": 222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529303.958, "dur": 7.417, + "args": { + "External id": 230112,"Sequence number": 2757931, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 223 + } + }, + { + "ph": "f", "id": 25, "pid": 4183442, "tid": 31331, "ts": 667115529303.958, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115529306.282, "dur": 4.848, + "args": { + "External id": 230113,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115529308.435, "dur": 2.576, + "args": { + "External id": 230114,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529317.620, "dur": 59.729, + "args": { + "External id": 230115,"Record function id": 0, "Sequence number": 2757930, "Fwd thread id": 1, "Ev Idx": 226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529318.835, "dur": 53.103, + "args": { + "External id": 230116,"Sequence number": 2757930, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 227 + } + }, + { + "ph": "f", "id": 26, "pid": 4183442, "tid": 31331, "ts": 667115529318.835, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115529320.452, "dur": 51.108, + "args": { + "External id": 230117,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115529323.873, "dur": 20.585, + "args": { + "External id": 230118,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115529325.137, "dur": 2.874, + "args": { + "External id": 230119,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115529328.919, "dur": 15.262, + "args": { + "External id": 230120,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115529330.150, "dur": 13.550, + "args": { + "External id": 230121,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115529345.694, "dur": 3.889, + "args": { + "External id": 230122,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115529348.366, "dur": 1.023, + "args": { + "External id": 230123,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115529350.336, "dur": 20.532, + "args": { + "External id": 230124,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529381.028, "dur": 53.082, + "args": { + "External id": 230125,"Record function id": 0, "Sequence number": 2757929, "Fwd thread id": 1, "Ev Idx": 236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529382.073, "dur": 48.759, + "args": { + "External id": 230126,"Sequence number": 2757929, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 237 + } + }, + { + "ph": "f", "id": 27, "pid": 4183442, "tid": 31331, "ts": 667115529382.073, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183442, "tid": 31331, + "ts": 667115529383.662, "dur": 46.925, + "args": { + "External id": 230127,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115529385.302, "dur": 20.818, + "args": { + "External id": 230128,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115529390.642, "dur": 2.275, + "args": { + "External id": 230129,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115529393.475, "dur": 12.395, + "args": { + "External id": 230130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115529394.445, "dur": 11.088, + "args": { + "External id": 230131,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115529407.264, "dur": 3.944, + "args": { + "External id": 230132,"Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115529410.024, "dur": 0.678, + "args": { + "External id": 230133,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115529411.747, "dur": 18.420, + "args": { + "External id": 230134,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529437.939, "dur": 87.974, + "args": { + "External id": 230135,"Record function id": 0, "Sequence number": 2757928, "Fwd thread id": 1, "Ev Idx": 246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529439.183, "dur": 82.917, + "args": { + "External id": 230136,"Sequence number": 2757928, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 247 + } + }, + { + "ph": "f", "id": 28, "pid": 4183442, "tid": 31331, "ts": 667115529439.183, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115529440.168, "dur": 81.540, + "args": { + "External id": 230137,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115529442.346, "dur": 18.344, + "args": { + "External id": 230138,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115529444.268, "dur": 2.475, + "args": { + "External id": 230139,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115529447.384, "dur": 13.066, + "args": { + "External id": 230140,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115529448.227, "dur": 11.857, + "args": { + "External id": 230141,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115529461.625, "dur": 4.328, + "args": { + "External id": 230142,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115529462.839, "dur": 2.956, + "args": { + "External id": 230143,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115529466.531, "dur": 54.259, + "args": { + "External id": 230144,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529531.808, "dur": 89.325, + "args": { + "External id": 230145,"Record function id": 0, "Sequence number": 2757927, "Fwd thread id": 1, "Ev Idx": 256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115529533.037, "dur": 70.220, + "args": { + "External id": 230146,"Sequence number": 2757927, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 257 + } + }, + { + "ph": "f", "id": 29, "pid": 4183442, "tid": 31331, "ts": 667115529533.037, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183442, "tid": 31331, + "ts": 667115529534.502, "dur": 68.519, + "args": { + "External id": 230147,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 31331, + "ts": 667115529535.631, "dur": 25.481, + "args": { + "External id": 230148,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115529540.910, "dur": 2.107, + "args": { + "External id": 230149,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 31331, + "ts": 667115529546.459, "dur": 14.396, + "args": { + "External id": 230150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 31331, + "ts": 667115529548.932, "dur": 11.576, + "args": { + "External id": 230151,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115529561.925, "dur": 1.994, + "args": { + "External id": 230152,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115529563.000, "dur": 0.737, + "args": { + "External id": 230153,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115529564.621, "dur": 37.767, + "args": { + "External id": 230154,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115529606.581, "dur": 12.775, + "args": { + "External id": 230155,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115529626.549, "dur": 382.114, + "args": { + "External id": 230156,"Record function id": 0, "Sequence number": 2757926, "Fwd thread id": 1, "Ev Idx": 267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115529627.721, "dur": 369.483, + "args": { + "External id": 230157,"Sequence number": 2757926, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 268 + } + }, + { + "ph": "f", "id": 30, "pid": 4183442, "tid": 31331, "ts": 667115529627.721, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115529828.851, "dur": 46.736, + "args": { + "External id": 230158,"kernel_hash": "c7hlzswdkogbe64wv2ovun6qprl5bfv2jkt7tamjc4frov6vf2kj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "262144", "1024", "1", "1986", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/7h/c7hlzswdkogbe64wv2ovun6qprl5bfv2jkt7tamjc4frov6vf2kj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 1024], [1024], [262144, 1024], [262144, 1024], [132, 1024], [262144], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_0", "pid": 4183442, "tid": 31331, + "ts": 667115529909.649, "dur": 26.693, + "args": { + "External id": 230159,"kernel_hash": "cii7bbv55hb3nctitgnfwrqgey5cb5renzwhxwkpcumbkexcm57j", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/ii/cii7bbv55hb3nctitgnfwrqgey5cb5renzwhxwkpcumbkexcm57j.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_1", "pid": 4183442, "tid": 31331, + "ts": 667115529953.978, "dur": 19.685, + "args": { + "External id": 230160,"kernel_hash": "crtgea2ng3an5hbp6paxzlkoogoerxlxvelprieartk62pibpe4e", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/rt/crtgea2ng3an5hbp6paxzlkoogoerxlxvelprieartk62pibpe4e.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530019.098, "dur": 11.726, + "args": { + "External id": 230161,"Record function id": 0, "Ev Idx": 272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530021.107, "dur": 8.840, + "args": { + "External id": 230162,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115530024.064, "dur": 5.004, + "args": { + "External id": 230163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115530026.030, "dur": 2.921, + "args": { + "External id": 230164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: StackBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530034.607, "dur": 33.265, + "args": { + "External id": 230165,"Record function id": 0, "Sequence number": 2757925, "Fwd thread id": 1, "Ev Idx": 276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "StackBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530035.998, "dur": 21.682, + "args": { + "External id": 230166,"Sequence number": 2757925, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 277 + } + }, + { + "ph": "f", "id": 31, "pid": 4183442, "tid": 31331, "ts": 667115530035.998, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115530038.334, "dur": 7.710, + "args": { + "External id": 230167,"Record function id": 0, "Concrete Inputs": ["", "-2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530043.281, "dur": 1.077, + "args": { + "External id": 230168,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115530046.714, "dur": 3.590, + "args": { + "External id": 230169,"Record function id": 0, "Concrete Inputs": ["", "-2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530049.209, "dur": 0.333, + "args": { + "External id": 230170,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115530050.941, "dur": 2.119, + "args": { + "External id": 230171,"Record function id": 0, "Concrete Inputs": ["", "-2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530051.885, "dur": 0.512, + "args": { + "External id": 230172,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 31331, + "ts": 667115530053.813, "dur": 3.401, + "args": { + "External id": 230173,"Record function id": 0, "Concrete Inputs": ["", "-2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530055.971, "dur": 0.374, + "args": { + "External id": 230174,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530071.457, "dur": 7.605, + "args": { + "External id": 230175,"Record function id": 0, "Sequence number": 2757924, "Fwd thread id": 1, "Ev Idx": 286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530072.510, "dur": 1.126, + "args": { + "External id": 230176,"Sequence number": 2757924, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 287 + } + }, + { + "ph": "f", "id": 32, "pid": 4183442, "tid": 31331, "ts": 667115530072.510, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115530082.866, "dur": 494.029, + "args": { + "External id": 230177,"Record function id": 0, "Sequence number": 2757923, "Fwd thread id": 1, "Ev Idx": 288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115530084.083, "dur": 476.867, + "args": { + "External id": 230178,"Sequence number": 2757923, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 289 + } + }, + { + "ph": "f", "id": 33, "pid": 4183442, "tid": 31331, "ts": 667115530084.083, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530121.902, "dur": 11.540, + "args": { + "External id": 230179,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115530129.050, "dur": 4.034, + "args": { + "External id": 230180,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530138.369, "dur": 9.859, + "args": { + "External id": 230181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530141.781, "dur": 5.561, + "args": { + "External id": 230182,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530144.862, "dur": 2.258, + "args": { + "External id": 230183,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 31331, + "ts": 667115530152.554, "dur": 118.020, + "args": { + "External id": 230184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530153.357, "dur": 4.672, + "args": { + "External id": 230185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530154.009, "dur": 3.165, + "args": { + "External id": 230186,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530156.491, "dur": 0.610, + "args": { + "External id": 230187,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 31331, + "ts": 667115530160.179, "dur": 109.464, + "args": { + "External id": 230188,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115530162.986, "dur": 105.506, + "args": { + "External id": 230189,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115530278.388, "dur": 4.189, + "args": { + "External id": 230190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530279.792, "dur": 2.664, + "args": { + "External id": 230191,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115530317.124, "dur": 6.528, + "args": { + "External id": 230192,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115530324.602, "dur": 1.724, + "args": { + "External id": 230193,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115530327.963, "dur": 1.904, + "args": { + "External id": 230194,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530366.932, "dur": 2.378, + "args": { + "External id": 230195,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530367.666, "dur": 1.476, + "args": { + "External id": 230196,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183442, "tid": 31331, + "ts": 667115530393.349, "dur": 145.937, + "args": { + "External id": 230197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115530398.943, "dur": 10.179, + "args": { + "External id": 230198,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530404.021, "dur": 2.813, + "args": { + "External id": 230199,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115530411.100, "dur": 5.870, + "args": { + "External id": 230200,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530415.332, "dur": 0.515, + "args": { + "External id": 230201,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115530418.359, "dur": 2.182, + "args": { + "External id": 230202,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530419.676, "dur": 0.515, + "args": { + "External id": 230203,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115530421.769, "dur": 3.358, + "args": { + "External id": 230204,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530423.760, "dur": 0.604, + "args": { + "External id": 230205,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115530430.836, "dur": 2.858, + "args": { + "External id": 230206,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530432.824, "dur": 0.497, + "args": { + "External id": 230207,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530434.956, "dur": 5.542, + "args": { + "External id": 230208,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115530438.631, "dur": 1.647, + "args": { + "External id": 230209,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115530441.591, "dur": 3.371, + "args": { + "External id": 230210,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530444.125, "dur": 0.561, + "args": { + "External id": 230211,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530445.787, "dur": 2.585, + "args": { + "External id": 230212,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530446.953, "dur": 1.329, + "args": { + "External id": 230213,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115530450.202, "dur": 75.087, + "args": { + "External id": 230214,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530528.398, "dur": 1.785, + "args": { + "External id": 230215,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115530531.536, "dur": 3.491, + "args": { + "External id": 230216,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530533.916, "dur": 0.506, + "args": { + "External id": 230217,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530537.066, "dur": 0.885, + "args": { + "External id": 230218,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530588.528, "dur": 10.020, + "args": { + "External id": 230219,"Record function id": 0, "Ev Idx": 330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530590.711, "dur": 7.107, + "args": { + "External id": 230220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115530593.315, "dur": 3.611, + "args": { + "External id": 230221,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115530594.359, "dur": 2.475, + "args": { + "External id": 230222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530602.641, "dur": 9.286, + "args": { + "External id": 230223,"Record function id": 0, "Sequence number": 2757922, "Fwd thread id": 1, "Ev Idx": 334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530604.016, "dur": 4.132, + "args": { + "External id": 230224,"Sequence number": 2757922, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 335 + } + }, + { + "ph": "f", "id": 34, "pid": 4183442, "tid": 31331, "ts": 667115530604.016, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530605.893, "dur": 2.082, + "args": { + "External id": 230225,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530606.948, "dur": 0.880, + "args": { + "External id": 230226,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530615.941, "dur": 169.689, + "args": { + "External id": 230227,"Record function id": 0, "Sequence number": 2757921, "Fwd thread id": 1, "Ev Idx": 338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530618.382, "dur": 157.705, + "args": { + "External id": 230228,"Sequence number": 2757921, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 339 + } + }, + { + "ph": "f", "id": 35, "pid": 4183442, "tid": 31331, "ts": 667115530618.382, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530622.674, "dur": 4.800, + "args": { + "External id": 230229,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530624.381, "dur": 2.486, + "args": { + "External id": 230230,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530626.033, "dur": 0.650, + "args": { + "External id": 230231,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115530628.896, "dur": 82.256, + "args": { + "External id": 230232,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530713.642, "dur": 6.807, + "args": { + "External id": 230233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530714.610, "dur": 4.958, + "args": { + "External id": 230234,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530718.323, "dur": 1.046, + "args": { + "External id": 230235,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530722.700, "dur": 5.190, + "args": { + "External id": 230236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530723.838, "dur": 3.584, + "args": { + "External id": 230237,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530725.205, "dur": 2.156, + "args": { + "External id": 230238,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115530728.680, "dur": 46.396, + "args": { + "External id": 230239,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530791.641, "dur": 10.161, + "args": { + "External id": 230240,"Record function id": 0, "Sequence number": 2757920, "Fwd thread id": 1, "Ev Idx": 351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530792.999, "dur": 6.898, + "args": { + "External id": 230241,"Sequence number": 2757920, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 352 + } + }, + { + "ph": "f", "id": 36, "pid": 4183442, "tid": 31331, "ts": 667115530792.999, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530794.933, "dur": 4.793, + "args": { + "External id": 230242,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530798.098, "dur": 1.531, + "args": { + "External id": 230243,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530805.703, "dur": 10.419, + "args": { + "External id": 230244,"Record function id": 0, "Sequence number": 2757919, "Fwd thread id": 1, "Ev Idx": 355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530806.740, "dur": 5.181, + "args": { + "External id": 230245,"Sequence number": 2757919, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 356 + } + }, + { + "ph": "f", "id": 37, "pid": 4183442, "tid": 31331, "ts": 667115530806.740, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530807.668, "dur": 4.042, + "args": { + "External id": 230246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530808.601, "dur": 2.551, + "args": { + "External id": 230247,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530810.280, "dur": 0.756, + "args": { + "External id": 230248,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530820.451, "dur": 6.271, + "args": { + "External id": 230249,"Record function id": 0, "Ev Idx": 360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115530822.293, "dur": 3.827, + "args": { + "External id": 230250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115530823.388, "dur": 2.430, + "args": { + "External id": 230251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115530824.089, "dur": 1.633, + "args": { + "External id": 230252,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530830.174, "dur": 9.046, + "args": { + "External id": 230253,"Record function id": 0, "Sequence number": 2757918, "Fwd thread id": 1, "Ev Idx": 364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530831.784, "dur": 4.605, + "args": { + "External id": 230254,"Sequence number": 2757918, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 365 + } + }, + { + "ph": "f", "id": 38, "pid": 4183442, "tid": 31331, "ts": 667115530831.784, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530834.681, "dur": 1.570, + "args": { + "External id": 230255,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530835.337, "dur": 0.821, + "args": { + "External id": 230256,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530843.811, "dur": 99.885, + "args": { + "External id": 230257,"Record function id": 0, "Sequence number": 2757917, "Fwd thread id": 1, "Ev Idx": 368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530844.624, "dur": 88.045, + "args": { + "External id": 230258,"Sequence number": 2757917, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 369 + } + }, + { + "ph": "f", "id": 39, "pid": 4183442, "tid": 31331, "ts": 667115530844.624, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530848.012, "dur": 5.567, + "args": { + "External id": 230259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530848.813, "dur": 4.298, + "args": { + "External id": 230260,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530852.390, "dur": 0.590, + "args": { + "External id": 230261,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115530854.204, "dur": 26.025, + "args": { + "External id": 230262,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530881.364, "dur": 5.316, + "args": { + "External id": 230263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530881.824, "dur": 4.359, + "args": { + "External id": 230264,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530883.353, "dur": 2.708, + "args": { + "External id": 230265,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530888.009, "dur": 4.677, + "args": { + "External id": 230266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530888.893, "dur": 3.379, + "args": { + "External id": 230267,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530891.735, "dur": 0.469, + "args": { + "External id": 230268,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115530893.437, "dur": 38.329, + "args": { + "External id": 230269,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530948.675, "dur": 34.108, + "args": { + "External id": 230270,"Record function id": 0, "Sequence number": 2757916, "Fwd thread id": 1, "Ev Idx": 381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530949.764, "dur": 4.403, + "args": { + "External id": 230271,"Sequence number": 2757916, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 382 + } + }, + { + "ph": "f", "id": 40, "pid": 4183442, "tid": 31331, "ts": 667115530949.764, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115530951.626, "dur": 2.397, + "args": { + "External id": 230272,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115530952.765, "dur": 1.119, + "args": { + "External id": 230273,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115530957.551, "dur": 22.446, + "args": { + "External id": 230274,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530986.606, "dur": 11.170, + "args": { + "External id": 230275,"Record function id": 0, "Sequence number": 2757915, "Fwd thread id": 1, "Ev Idx": 386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115530987.685, "dur": 6.765, + "args": { + "External id": 230276,"Sequence number": 2757915, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 387 + } + }, + { + "ph": "f", "id": 41, "pid": 4183442, "tid": 31331, "ts": 667115530987.685, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115530990.948, "dur": 3.302, + "args": { + "External id": 230277,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115530991.777, "dur": 1.968, + "args": { + "External id": 230278,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115530993.185, "dur": 0.436, + "args": { + "External id": 230279,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531002.076, "dur": 5.632, + "args": { + "External id": 230280,"Record function id": 0, "Ev Idx": 391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531003.963, "dur": 3.189, + "args": { + "External id": 230281,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115531004.855, "dur": 1.888, + "args": { + "External id": 230282,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115531005.557, "dur": 1.052, + "args": { + "External id": 230283,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115531012.021, "dur": 435.804, + "args": { + "External id": 230284,"Record function id": 0, "Sequence number": 2757914, "Fwd thread id": 1, "Ev Idx": 395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115531013.573, "dur": 416.517, + "args": { + "External id": 230285,"Sequence number": 2757914, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 396 + } + }, + { + "ph": "f", "id": 42, "pid": 4183442, "tid": 31331, "ts": 667115531013.573, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 31331, + "ts": 667115531040.092, "dur": 35.312, + "args": { + "External id": 230286,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115531041.801, "dur": 33.346, + "args": { + "External id": 230287,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115531045.025, "dur": 6.087, + "args": { + "External id": 230288,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115531047.935, "dur": 2.581, + "args": { + "External id": 230289,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115531052.344, "dur": 22.372, + "args": { + "External id": 230290,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531089.173, "dur": 3.859, + "args": { + "External id": 230291,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531089.999, "dur": 2.876, + "args": { + "External id": 230292,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531096.947, "dur": 1.940, + "args": { + "External id": 230293,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531097.947, "dur": 0.851, + "args": { + "External id": 230294,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115531113.769, "dur": 2.155, + "args": { + "External id": 230295,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115531128.918, "dur": 3.020, + "args": { + "External id": 230296,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531324.470, "dur": 1.961, + "args": { + "External id": 230297,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115531330.883, "dur": 31.210, + "args": { + "External id": 230298,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531340.026, "dur": 0.959, + "args": { + "External id": 230299,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115531368.272, "dur": 28.072, + "args": { + "External id": 230300,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115531370.008, "dur": 26.120, + "args": { + "External id": 230301,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531374.386, "dur": 3.723, + "args": { + "External id": 230302,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115531381.292, "dur": 14.342, + "args": { + "External id": 230303,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115531400.722, "dur": 2.426, + "args": { + "External id": 230304,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531401.930, "dur": 1.080, + "args": { + "External id": 230305,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531409.917, "dur": 4.297, + "args": { + "External id": 230306,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531411.317, "dur": 2.773, + "args": { + "External id": 230307,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531416.659, "dur": 2.533, + "args": { + "External id": 230308,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531417.948, "dur": 1.152, + "args": { + "External id": 230309,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531458.549, "dur": 8.787, + "args": { + "External id": 230310,"Record function id": 0, "Ev Idx": 421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531460.905, "dur": 5.680, + "args": { + "External id": 230311,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115531462.644, "dur": 2.946, + "args": { + "External id": 230312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115531463.814, "dur": 1.631, + "args": { + "External id": 230313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531471.018, "dur": 8.288, + "args": { + "External id": 230314,"Record function id": 0, "Sequence number": 2757913, "Fwd thread id": 1, "Ev Idx": 425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531472.360, "dur": 3.668, + "args": { + "External id": 230315,"Sequence number": 2757913, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 426 + } + }, + { + "ph": "f", "id": 43, "pid": 4183442, "tid": 31331, "ts": 667115531472.360, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531473.778, "dur": 2.077, + "args": { + "External id": 230316,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531474.634, "dur": 1.080, + "args": { + "External id": 230317,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531484.734, "dur": 164.949, + "args": { + "External id": 230318,"Record function id": 0, "Sequence number": 2757912, "Fwd thread id": 1, "Ev Idx": 429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531485.607, "dur": 156.833, + "args": { + "External id": 230319,"Sequence number": 2757912, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 430 + } + }, + { + "ph": "f", "id": 44, "pid": 4183442, "tid": 31331, "ts": 667115531485.607, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115531488.346, "dur": 25.930, + "args": { + "External id": 230320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115531490.098, "dur": 23.281, + "args": { + "External id": 230321,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531511.693, "dur": 1.223, + "args": { + "External id": 230322,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115531515.608, "dur": 74.366, + "args": { + "External id": 230323,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115531591.822, "dur": 7.687, + "args": { + "External id": 230324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115531594.342, "dur": 4.447, + "args": { + "External id": 230325,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531596.349, "dur": 2.274, + "args": { + "External id": 230326,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115531601.333, "dur": 3.244, + "args": { + "External id": 230327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115531602.207, "dur": 1.689, + "args": { + "External id": 230328,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531603.403, "dur": 0.430, + "args": { + "External id": 230329,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115531605.135, "dur": 36.330, + "args": { + "External id": 230330,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531694.988, "dur": 14.534, + "args": { + "External id": 230331,"Record function id": 0, "Sequence number": 2757911, "Fwd thread id": 1, "Ev Idx": 442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531696.631, "dur": 9.498, + "args": { + "External id": 230332,"Sequence number": 2757911, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 443 + } + }, + { + "ph": "f", "id": 45, "pid": 4183442, "tid": 31331, "ts": 667115531696.631, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531700.523, "dur": 5.432, + "args": { + "External id": 230333,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531701.750, "dur": 4.013, + "args": { + "External id": 230334,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531712.919, "dur": 9.456, + "args": { + "External id": 230335,"Record function id": 0, "Sequence number": 2757910, "Fwd thread id": 1, "Ev Idx": 446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531714.168, "dur": 5.633, + "args": { + "External id": 230336,"Sequence number": 2757910, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 447 + } + }, + { + "ph": "f", "id": 46, "pid": 4183442, "tid": 31331, "ts": 667115531714.168, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115531715.666, "dur": 3.915, + "args": { + "External id": 230337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115531716.420, "dur": 2.683, + "args": { + "External id": 230338,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531718.477, "dur": 0.502, + "args": { + "External id": 230339,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531726.792, "dur": 8.730, + "args": { + "External id": 230340,"Record function id": 0, "Ev Idx": 451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115531728.450, "dur": 6.510, + "args": { + "External id": 230341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115531730.219, "dur": 4.382, + "args": { + "External id": 230342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115531732.663, "dur": 1.818, + "args": { + "External id": 230343,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531738.520, "dur": 8.183, + "args": { + "External id": 230344,"Record function id": 0, "Sequence number": 2757909, "Fwd thread id": 1, "Ev Idx": 455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115531739.766, "dur": 4.315, + "args": { + "External id": 230345,"Sequence number": 2757909, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 456 + } + }, + { + "ph": "f", "id": 47, "pid": 4183442, "tid": 31331, "ts": 667115531739.766, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115531741.391, "dur": 2.532, + "args": { + "External id": 230346,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115531742.363, "dur": 1.412, + "args": { + "External id": 230347,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115531751.632, "dur": 312.162, + "args": { + "External id": 230348,"Record function id": 0, "Sequence number": 2757908, "Fwd thread id": 1, "Ev Idx": 459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115531753.295, "dur": 290.941, + "args": { + "External id": 230349,"Sequence number": 2757908, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 460 + } + }, + { + "ph": "f", "id": 48, "pid": 4183442, "tid": 31331, "ts": 667115531753.295, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115531772.619, "dur": 7.441, + "args": { + "External id": 230350,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531775.447, "dur": 4.147, + "args": { + "External id": 230351,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115531782.312, "dur": 3.642, + "args": { + "External id": 230352,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531783.793, "dur": 1.964, + "args": { + "External id": 230353,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115531787.474, "dur": 5.558, + "args": { + "External id": 230354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115531789.374, "dur": 3.466, + "args": { + "External id": 230355,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115531822.587, "dur": 194.804, + "args": { + "External id": 230356,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115531916.923, "dur": 3.268, + "args": { + "External id": 230357,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115531922.215, "dur": 3.388, + "args": { + "External id": 230358,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115532031.368, "dur": 3.289, + "args": { + "External id": 230359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115532037.706, "dur": 1.100, + "args": { + "External id": 230360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115532040.759, "dur": 0.816, + "args": { + "External id": 230361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115532071.268, "dur": 230.661, + "args": { + "External id": 230362,"Record function id": 0, "Sequence number": 2757907, "Fwd thread id": 1, "Ev Idx": 473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115532073.103, "dur": 221.234, + "args": { + "External id": 230363,"Sequence number": 2757907, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 474 + } + }, + { + "ph": "f", "id": 49, "pid": 4183442, "tid": 31331, "ts": 667115532073.103, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115532096.566, "dur": 40.504, + "args": { + "External id": 230364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532099.835, "dur": 2.476, + "args": { + "External id": 230365,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115532103.866, "dur": 32.475, + "args": { + "External id": 230366,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115532148.026, "dur": 4.224, + "args": { + "External id": 230367,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532149.604, "dur": 2.379, + "args": { + "External id": 230368,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115532308.975, "dur": 150.208, + "args": { + "External id": 230369,"Record function id": 0, "Sequence number": 2757906, "Fwd thread id": 1, "Ev Idx": 480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115532311.207, "dur": 141.396, + "args": { + "External id": 230370,"Sequence number": 2757906, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 481 + } + }, + { + "ph": "f", "id": 50, "pid": 4183442, "tid": 31331, "ts": 667115532311.207, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115532322.985, "dur": 28.275, + "args": { + "External id": 230371,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532325.383, "dur": 2.254, + "args": { + "External id": 230372,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115532328.721, "dur": 22.004, + "args": { + "External id": 230373,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115532358.552, "dur": 6.253, + "args": { + "External id": 230374,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532360.583, "dur": 3.950, + "args": { + "External id": 230375,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532465.136, "dur": 13.274, + "args": { + "External id": 230376,"Record function id": 0, "Sequence number": 2757905, "Fwd thread id": 1, "Ev Idx": 487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532466.355, "dur": 9.416, + "args": { + "External id": 230377,"Sequence number": 2757905, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 488 + } + }, + { + "ph": "f", "id": 51, "pid": 4183442, "tid": 31331, "ts": 667115532466.355, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532468.503, "dur": 7.048, + "args": { + "External id": 230378,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532470.376, "dur": 4.972, + "args": { + "External id": 230379,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532481.741, "dur": 7.453, + "args": { + "External id": 230380,"Record function id": 0, "Sequence number": 2757904, "Fwd thread id": 1, "Ev Idx": 491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532482.978, "dur": 4.036, + "args": { + "External id": 230381,"Sequence number": 2757904, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 492 + } + }, + { + "ph": "f", "id": 52, "pid": 4183442, "tid": 31331, "ts": 667115532482.978, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532484.541, "dur": 2.318, + "args": { + "External id": 230382,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532485.774, "dur": 0.950, + "args": { + "External id": 230383,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532513.333, "dur": 11.522, + "args": { + "External id": 230384,"Record function id": 0, "Sequence number": 2757903, "Fwd thread id": 1, "Ev Idx": 495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532516.813, "dur": 4.987, + "args": { + "External id": 230385,"Sequence number": 2757903, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 496 + } + }, + { + "ph": "f", "id": 53, "pid": 4183442, "tid": 31331, "ts": 667115532516.813, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532518.542, "dur": 3.091, + "args": { + "External id": 230386,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532519.853, "dur": 1.562, + "args": { + "External id": 230387,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532528.753, "dur": 7.408, + "args": { + "External id": 230388,"Record function id": 0, "Sequence number": 2757902, "Fwd thread id": 1, "Ev Idx": 499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532530.222, "dur": 3.408, + "args": { + "External id": 230389,"Sequence number": 2757902, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 500 + } + }, + { + "ph": "f", "id": 54, "pid": 4183442, "tid": 31331, "ts": 667115532530.222, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532531.310, "dur": 2.153, + "args": { + "External id": 230390,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532532.321, "dur": 1.048, + "args": { + "External id": 230391,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532539.439, "dur": 236.242, + "args": { + "External id": 230392,"Record function id": 0, "Sequence number": 2757901, "Fwd thread id": 1, "Ev Idx": 503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532540.614, "dur": 223.068, + "args": { + "External id": 230393,"Sequence number": 2757901, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 504 + } + }, + { + "ph": "f", "id": 55, "pid": 4183442, "tid": 31331, "ts": 667115532540.614, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532547.045, "dur": 6.491, + "args": { + "External id": 230394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532548.861, "dur": 4.034, + "args": { + "External id": 230395,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532551.107, "dur": 1.533, + "args": { + "External id": 230396,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115532555.028, "dur": 81.057, + "args": { + "External id": 230397,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532637.547, "dur": 6.934, + "args": { + "External id": 230398,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532638.130, "dur": 5.615, + "args": { + "External id": 230399,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532642.239, "dur": 1.330, + "args": { + "External id": 230400,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532707.041, "dur": 5.724, + "args": { + "External id": 230401,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532709.395, "dur": 2.603, + "args": { + "External id": 230402,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532711.184, "dur": 0.548, + "args": { + "External id": 230403,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115532713.584, "dur": 48.897, + "args": { + "External id": 230404,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532783.193, "dur": 7.563, + "args": { + "External id": 230405,"Record function id": 0, "Sequence number": 2757900, "Fwd thread id": 1, "Ev Idx": 516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532784.220, "dur": 4.611, + "args": { + "External id": 230406,"Sequence number": 2757900, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 517 + } + }, + { + "ph": "f", "id": 56, "pid": 4183442, "tid": 31331, "ts": 667115532784.220, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532786.065, "dur": 2.588, + "args": { + "External id": 230407,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532786.864, "dur": 1.670, + "args": { + "External id": 230408,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532794.153, "dur": 10.373, + "args": { + "External id": 230409,"Record function id": 0, "Sequence number": 2757899, "Fwd thread id": 1, "Ev Idx": 520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532797.136, "dur": 4.498, + "args": { + "External id": 230410,"Sequence number": 2757899, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 521 + } + }, + { + "ph": "f", "id": 57, "pid": 4183442, "tid": 31331, "ts": 667115532797.136, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532797.945, "dur": 3.494, + "args": { + "External id": 230411,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532798.709, "dur": 2.197, + "args": { + "External id": 230412,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532800.132, "dur": 0.642, + "args": { + "External id": 230413,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115532810.178, "dur": 9.442, + "args": { + "External id": 230414,"Record function id": 0, "Ev Idx": 525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115532812.190, "dur": 6.657, + "args": { + "External id": 230415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115532814.650, "dur": 3.774, + "args": { + "External id": 230416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115532815.638, "dur": 2.649, + "args": { + "External id": 230417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532825.149, "dur": 7.981, + "args": { + "External id": 230418,"Record function id": 0, "Sequence number": 2757898, "Fwd thread id": 1, "Ev Idx": 529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532826.581, "dur": 4.103, + "args": { + "External id": 230419,"Sequence number": 2757898, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 530 + } + }, + { + "ph": "f", "id": 58, "pid": 4183442, "tid": 31331, "ts": 667115532826.581, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532827.635, "dur": 2.893, + "args": { + "External id": 230420,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532829.560, "dur": 0.831, + "args": { + "External id": 230421,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532836.474, "dur": 100.793, + "args": { + "External id": 230422,"Record function id": 0, "Sequence number": 2757897, "Fwd thread id": 1, "Ev Idx": 533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532837.383, "dur": 93.028, + "args": { + "External id": 230423,"Sequence number": 2757897, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 534 + } + }, + { + "ph": "f", "id": 59, "pid": 4183442, "tid": 31331, "ts": 667115532837.383, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532839.903, "dur": 2.997, + "args": { + "External id": 230424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532840.337, "dur": 2.107, + "args": { + "External id": 230425,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532841.885, "dur": 0.421, + "args": { + "External id": 230426,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115532845.333, "dur": 39.254, + "args": { + "External id": 230427,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532885.753, "dur": 3.283, + "args": { + "External id": 230428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532886.282, "dur": 2.164, + "args": { + "External id": 230429,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532887.719, "dur": 0.621, + "args": { + "External id": 230430,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532890.357, "dur": 4.792, + "args": { + "External id": 230431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532891.176, "dur": 3.525, + "args": { + "External id": 230432,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532892.485, "dur": 2.130, + "args": { + "External id": 230433,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115532897.476, "dur": 32.138, + "args": { + "External id": 230434,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532941.540, "dur": 32.253, + "args": { + "External id": 230435,"Record function id": 0, "Sequence number": 2757896, "Fwd thread id": 1, "Ev Idx": 546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532942.537, "dur": 4.008, + "args": { + "External id": 230436,"Sequence number": 2757896, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 547 + } + }, + { + "ph": "f", "id": 60, "pid": 4183442, "tid": 31331, "ts": 667115532942.537, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115532944.237, "dur": 2.169, + "args": { + "External id": 230437,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115532945.229, "dur": 1.081, + "args": { + "External id": 230438,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115532949.533, "dur": 22.263, + "args": { + "External id": 230439,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532977.449, "dur": 9.569, + "args": { + "External id": 230440,"Record function id": 0, "Sequence number": 2757895, "Fwd thread id": 1, "Ev Idx": 551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115532978.502, "dur": 6.654, + "args": { + "External id": 230441,"Sequence number": 2757895, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 552 + } + }, + { + "ph": "f", "id": 61, "pid": 4183442, "tid": 31331, "ts": 667115532978.502, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115532979.328, "dur": 5.623, + "args": { + "External id": 230442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115532981.979, "dur": 2.424, + "args": { + "External id": 230443,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115532983.891, "dur": 0.396, + "args": { + "External id": 230444,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115532991.004, "dur": 5.589, + "args": { + "External id": 230445,"Record function id": 0, "Ev Idx": 556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115532992.689, "dur": 3.328, + "args": { + "External id": 230446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115532993.871, "dur": 1.768, + "args": { + "External id": 230447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115532994.357, "dur": 1.185, + "args": { + "External id": 230448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533000.616, "dur": 6.660, + "args": { + "External id": 230449,"Record function id": 0, "Sequence number": 2757894, "Fwd thread id": 1, "Ev Idx": 560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533002.116, "dur": 3.174, + "args": { + "External id": 230450,"Sequence number": 2757894, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 561 + } + }, + { + "ph": "f", "id": 62, "pid": 4183442, "tid": 31331, "ts": 667115533002.116, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533003.331, "dur": 1.813, + "args": { + "External id": 230451,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533004.189, "dur": 0.812, + "args": { + "External id": 230452,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533012.156, "dur": 94.865, + "args": { + "External id": 230453,"Record function id": 0, "Sequence number": 2757893, "Fwd thread id": 1, "Ev Idx": 564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533013.128, "dur": 85.235, + "args": { + "External id": 230454,"Sequence number": 2757893, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 565 + } + }, + { + "ph": "f", "id": 63, "pid": 4183442, "tid": 31331, "ts": 667115533013.128, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533015.865, "dur": 2.894, + "args": { + "External id": 230455,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533016.247, "dur": 2.056, + "args": { + "External id": 230456,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533017.744, "dur": 0.436, + "args": { + "External id": 230457,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115533019.405, "dur": 35.999, + "args": { + "External id": 230458,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533056.661, "dur": 5.534, + "args": { + "External id": 230459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533059.122, "dur": 2.386, + "args": { + "External id": 230460,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533060.874, "dur": 0.528, + "args": { + "External id": 230461,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533063.753, "dur": 2.733, + "args": { + "External id": 230462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533064.559, "dur": 1.517, + "args": { + "External id": 230463,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533065.728, "dur": 0.280, + "args": { + "External id": 230464,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115533066.932, "dur": 30.652, + "args": { + "External id": 230465,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533111.328, "dur": 25.556, + "args": { + "External id": 230466,"Record function id": 0, "Sequence number": 2757892, "Fwd thread id": 1, "Ev Idx": 577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533114.365, "dur": 4.047, + "args": { + "External id": 230467,"Sequence number": 2757892, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 578 + } + }, + { + "ph": "f", "id": 64, "pid": 4183442, "tid": 31331, "ts": 667115533114.365, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533116.190, "dur": 2.074, + "args": { + "External id": 230468,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533117.111, "dur": 1.040, + "args": { + "External id": 230469,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115533120.552, "dur": 14.343, + "args": { + "External id": 230470,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533140.591, "dur": 10.936, + "args": { + "External id": 230471,"Record function id": 0, "Sequence number": 2757891, "Fwd thread id": 1, "Ev Idx": 582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533141.488, "dur": 7.161, + "args": { + "External id": 230472,"Sequence number": 2757891, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 583 + } + }, + { + "ph": "f", "id": 65, "pid": 4183442, "tid": 31331, "ts": 667115533141.488, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533142.197, "dur": 6.244, + "args": { + "External id": 230473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533144.451, "dur": 3.464, + "args": { + "External id": 230474,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533147.106, "dur": 0.656, + "args": { + "External id": 230475,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115533155.611, "dur": 5.229, + "args": { + "External id": 230476,"Record function id": 0, "Ev Idx": 587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115533157.332, "dur": 3.043, + "args": { + "External id": 230477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115533158.191, "dur": 1.864, + "args": { + "External id": 230478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115533158.616, "dur": 1.341, + "args": { + "External id": 230479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115533165.291, "dur": 380.126, + "args": { + "External id": 230480,"Record function id": 0, "Sequence number": 2757890, "Fwd thread id": 1, "Ev Idx": 591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115533167.046, "dur": 320.547, + "args": { + "External id": 230481,"Sequence number": 2757890, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 592 + } + }, + { + "ph": "f", "id": 66, "pid": 4183442, "tid": 31331, "ts": 667115533167.046, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533201.341, "dur": 2.163, + "args": { + "External id": 230482,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533202.208, "dur": 1.126, + "args": { + "External id": 230483,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115533217.979, "dur": 5.161, + "args": { + "External id": 230484,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115533235.667, "dur": 4.721, + "args": { + "External id": 230485,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533387.840, "dur": 1.917, + "args": { + "External id": 230486,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115533394.106, "dur": 35.081, + "args": { + "External id": 230487,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533404.383, "dur": 0.837, + "args": { + "External id": 230488,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115533434.753, "dur": 28.927, + "args": { + "External id": 230489,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115533436.592, "dur": 26.807, + "args": { + "External id": 230490,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533441.146, "dur": 3.870, + "args": { + "External id": 230491,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115533446.653, "dur": 16.245, + "args": { + "External id": 230492,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115533468.020, "dur": 4.773, + "args": { + "External id": 230493,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533471.454, "dur": 1.196, + "args": { + "External id": 230494,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533478.895, "dur": 1.920, + "args": { + "External id": 230495,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533479.996, "dur": 0.725, + "args": { + "External id": 230496,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115533520.171, "dur": 19.006, + "args": { + "External id": 230497,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115533558.411, "dur": 9.373, + "args": { + "External id": 230498,"Record function id": 0, "Ev Idx": 609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115533560.821, "dur": 6.199, + "args": { + "External id": 230499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115533562.899, "dur": 3.114, + "args": { + "External id": 230500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115533563.758, "dur": 2.133, + "args": { + "External id": 230501,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533573.786, "dur": 6.999, + "args": { + "External id": 230502,"Record function id": 0, "Sequence number": 2757889, "Fwd thread id": 1, "Ev Idx": 613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115533575.128, "dur": 1.612, + "args": { + "External id": 230503,"Sequence number": 2757889, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 614 + } + }, + { + "ph": "f", "id": 67, "pid": 4183442, "tid": 31331, "ts": 667115533575.128, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115533584.591, "dur": 455.218, + "args": { + "External id": 230504,"Record function id": 0, "Sequence number": 2757888, "Fwd thread id": 1, "Ev Idx": 615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115533586.309, "dur": 440.516, + "args": { + "External id": 230505,"Sequence number": 2757888, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 616 + } + }, + { + "ph": "f", "id": 68, "pid": 4183442, "tid": 31331, "ts": 667115533586.309, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533618.822, "dur": 8.801, + "args": { + "External id": 230506,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115533624.295, "dur": 3.061, + "args": { + "External id": 230507,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533630.984, "dur": 6.459, + "args": { + "External id": 230508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533632.275, "dur": 4.504, + "args": { + "External id": 230509,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533634.021, "dur": 2.586, + "args": { + "External id": 230510,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 31331, + "ts": 667115533642.591, "dur": 137.616, + "args": { + "External id": 230511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115533643.412, "dur": 2.686, + "args": { + "External id": 230512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115533643.807, "dur": 1.812, + "args": { + "External id": 230513,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533645.196, "dur": 0.340, + "args": { + "External id": 230514,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 31331, + "ts": 667115533647.290, "dur": 132.148, + "args": { + "External id": 230515,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115533648.455, "dur": 129.880, + "args": { + "External id": 230516,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115533785.582, "dur": 5.706, + "args": { + "External id": 230517,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533788.960, "dur": 2.200, + "args": { + "External id": 230518,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115533825.367, "dur": 5.551, + "args": { + "External id": 230519,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115533832.458, "dur": 2.179, + "args": { + "External id": 230520,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115533835.718, "dur": 1.532, + "args": { + "External id": 230521,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533869.192, "dur": 2.921, + "args": { + "External id": 230522,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533870.267, "dur": 1.656, + "args": { + "External id": 230523,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183442, "tid": 31331, + "ts": 667115533894.883, "dur": 112.799, + "args": { + "External id": 230524,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115533899.735, "dur": 7.493, + "args": { + "External id": 230525,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533903.417, "dur": 2.993, + "args": { + "External id": 230526,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115533909.049, "dur": 6.466, + "args": { + "External id": 230527,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533914.100, "dur": 0.741, + "args": { + "External id": 230528,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115533916.782, "dur": 2.310, + "args": { + "External id": 230529,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533918.418, "dur": 0.283, + "args": { + "External id": 230530,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115533919.941, "dur": 3.217, + "args": { + "External id": 230531,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533922.056, "dur": 0.664, + "args": { + "External id": 230532,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115533926.768, "dur": 3.369, + "args": { + "External id": 230533,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533929.154, "dur": 0.669, + "args": { + "External id": 230534,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533932.564, "dur": 5.717, + "args": { + "External id": 230535,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115533936.430, "dur": 1.673, + "args": { + "External id": 230536,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115533939.142, "dur": 2.919, + "args": { + "External id": 230537,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115533941.237, "dur": 0.490, + "args": { + "External id": 230538,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115533943.237, "dur": 3.414, + "args": { + "External id": 230539,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533944.029, "dur": 2.521, + "args": { + "External id": 230540,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115533948.329, "dur": 47.231, + "args": { + "External id": 230541,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115533997.407, "dur": 1.157, + "args": { + "External id": 230542,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115533999.574, "dur": 3.629, + "args": { + "External id": 230543,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534001.870, "dur": 0.561, + "args": { + "External id": 230544,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534005.639, "dur": 0.920, + "args": { + "External id": 230545,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534051.569, "dur": 9.160, + "args": { + "External id": 230546,"Record function id": 0, "Ev Idx": 657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534053.810, "dur": 6.237, + "args": { + "External id": 230547,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115534056.030, "dur": 3.206, + "args": { + "External id": 230548,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115534057.042, "dur": 2.077, + "args": { + "External id": 230549,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534064.738, "dur": 7.856, + "args": { + "External id": 230550,"Record function id": 0, "Sequence number": 2757887, "Fwd thread id": 1, "Ev Idx": 661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534066.327, "dur": 3.640, + "args": { + "External id": 230551,"Sequence number": 2757887, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 662 + } + }, + { + "ph": "f", "id": 69, "pid": 4183442, "tid": 31331, "ts": 667115534066.327, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534067.932, "dur": 1.859, + "args": { + "External id": 230552,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534068.807, "dur": 0.851, + "args": { + "External id": 230553,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534076.128, "dur": 104.853, + "args": { + "External id": 230554,"Record function id": 0, "Sequence number": 2757886, "Fwd thread id": 1, "Ev Idx": 665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534077.254, "dur": 94.981, + "args": { + "External id": 230555,"Sequence number": 2757886, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 666 + } + }, + { + "ph": "f", "id": 70, "pid": 4183442, "tid": 31331, "ts": 667115534077.254, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534082.519, "dur": 4.282, + "args": { + "External id": 230556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534083.894, "dur": 2.333, + "args": { + "External id": 230557,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534085.610, "dur": 0.475, + "args": { + "External id": 230558,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115534088.325, "dur": 32.093, + "args": { + "External id": 230559,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534121.556, "dur": 6.042, + "args": { + "External id": 230560,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534122.329, "dur": 4.447, + "args": { + "External id": 230561,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534125.605, "dur": 1.007, + "args": { + "External id": 230562,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534129.402, "dur": 4.527, + "args": { + "External id": 230563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534130.190, "dur": 3.292, + "args": { + "External id": 230564,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534131.225, "dur": 2.171, + "args": { + "External id": 230565,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115534134.362, "dur": 37.049, + "args": { + "External id": 230566,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534185.844, "dur": 7.325, + "args": { + "External id": 230567,"Record function id": 0, "Sequence number": 2757885, "Fwd thread id": 1, "Ev Idx": 678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534187.084, "dur": 4.066, + "args": { + "External id": 230568,"Sequence number": 2757885, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 679 + } + }, + { + "ph": "f", "id": 71, "pid": 4183442, "tid": 31331, "ts": 667115534187.084, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534188.676, "dur": 2.324, + "args": { + "External id": 230569,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534189.914, "dur": 0.942, + "args": { + "External id": 230570,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534196.652, "dur": 10.183, + "args": { + "External id": 230571,"Record function id": 0, "Sequence number": 2757884, "Fwd thread id": 1, "Ev Idx": 682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534199.195, "dur": 4.813, + "args": { + "External id": 230572,"Sequence number": 2757884, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 683 + } + }, + { + "ph": "f", "id": 72, "pid": 4183442, "tid": 31331, "ts": 667115534199.195, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534199.970, "dur": 3.830, + "args": { + "External id": 230573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534200.785, "dur": 2.529, + "args": { + "External id": 230574,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534202.602, "dur": 0.604, + "args": { + "External id": 230575,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534210.942, "dur": 6.353, + "args": { + "External id": 230576,"Record function id": 0, "Ev Idx": 687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534212.952, "dur": 3.852, + "args": { + "External id": 230577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115534214.286, "dur": 2.029, + "args": { + "External id": 230578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115534214.866, "dur": 1.351, + "args": { + "External id": 230579,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534220.692, "dur": 8.057, + "args": { + "External id": 230580,"Record function id": 0, "Sequence number": 2757883, "Fwd thread id": 1, "Ev Idx": 691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534222.196, "dur": 4.244, + "args": { + "External id": 230581,"Sequence number": 2757883, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 692 + } + }, + { + "ph": "f", "id": 73, "pid": 4183442, "tid": 31331, "ts": 667115534222.196, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534223.231, "dur": 3.062, + "args": { + "External id": 230582,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534225.463, "dur": 0.685, + "args": { + "External id": 230583,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534231.812, "dur": 96.636, + "args": { + "External id": 230584,"Record function id": 0, "Sequence number": 2757882, "Fwd thread id": 1, "Ev Idx": 695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534232.704, "dur": 85.599, + "args": { + "External id": 230585,"Sequence number": 2757882, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 696 + } + }, + { + "ph": "f", "id": 74, "pid": 4183442, "tid": 31331, "ts": 667115534232.704, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534235.997, "dur": 6.279, + "args": { + "External id": 230586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534236.453, "dur": 5.358, + "args": { + "External id": 230587,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534241.176, "dur": 0.503, + "args": { + "External id": 230588,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115534245.018, "dur": 26.305, + "args": { + "External id": 230589,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534272.376, "dur": 6.141, + "args": { + "External id": 230590,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534272.910, "dur": 5.027, + "args": { + "External id": 230591,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534274.509, "dur": 3.270, + "args": { + "External id": 230592,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534279.858, "dur": 4.739, + "args": { + "External id": 230593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534280.613, "dur": 3.406, + "args": { + "External id": 230594,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534283.508, "dur": 0.446, + "args": { + "External id": 230595,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115534285.257, "dur": 32.190, + "args": { + "External id": 230596,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534332.686, "dur": 28.128, + "args": { + "External id": 230597,"Record function id": 0, "Sequence number": 2757881, "Fwd thread id": 1, "Ev Idx": 708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534333.623, "dur": 4.145, + "args": { + "External id": 230598,"Sequence number": 2757881, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 709 + } + }, + { + "ph": "f", "id": 75, "pid": 4183442, "tid": 31331, "ts": 667115534333.623, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534335.376, "dur": 2.228, + "args": { + "External id": 230599,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534336.359, "dur": 1.151, + "args": { + "External id": 230600,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115534340.495, "dur": 17.839, + "args": { + "External id": 230601,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534364.758, "dur": 9.052, + "args": { + "External id": 230602,"Record function id": 0, "Sequence number": 2757880, "Fwd thread id": 1, "Ev Idx": 713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534365.741, "dur": 5.631, + "args": { + "External id": 230603,"Sequence number": 2757880, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 714 + } + }, + { + "ph": "f", "id": 76, "pid": 4183442, "tid": 31331, "ts": 667115534365.741, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534366.767, "dur": 4.384, + "args": { + "External id": 230604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534367.538, "dur": 3.121, + "args": { + "External id": 230605,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534370.210, "dur": 0.318, + "args": { + "External id": 230606,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534377.776, "dur": 4.938, + "args": { + "External id": 230607,"Record function id": 0, "Ev Idx": 718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534379.363, "dur": 2.820, + "args": { + "External id": 230608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115534380.189, "dur": 1.624, + "args": { + "External id": 230609,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115534380.872, "dur": 0.845, + "args": { + "External id": 230610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115534388.923, "dur": 469.743, + "args": { + "External id": 230611,"Record function id": 0, "Sequence number": 2757879, "Fwd thread id": 1, "Ev Idx": 722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115534390.506, "dur": 431.864, + "args": { + "External id": 230612,"Sequence number": 2757879, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 723 + } + }, + { + "ph": "f", "id": 77, "pid": 4183442, "tid": 31331, "ts": 667115534390.506, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 31331, + "ts": 667115534411.421, "dur": 31.553, + "args": { + "External id": 230613,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115534412.765, "dur": 30.022, + "args": { + "External id": 230614,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115534415.534, "dur": 5.651, + "args": { + "External id": 230615,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115534418.183, "dur": 2.517, + "args": { + "External id": 230616,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115534422.334, "dur": 20.010, + "args": { + "External id": 230617,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534453.354, "dur": 5.756, + "args": { + "External id": 230618,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534455.917, "dur": 3.036, + "args": { + "External id": 230619,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534463.096, "dur": 1.374, + "args": { + "External id": 230620,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534463.714, "dur": 0.658, + "args": { + "External id": 230621,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115534476.109, "dur": 2.094, + "args": { + "External id": 230622,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115534489.198, "dur": 21.942, + "args": { + "External id": 230623,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534710.905, "dur": 3.651, + "args": { + "External id": 230624,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115534718.865, "dur": 33.244, + "args": { + "External id": 230625,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534728.730, "dur": 0.927, + "args": { + "External id": 230626,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115534758.372, "dur": 27.326, + "args": { + "External id": 230627,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115534759.926, "dur": 25.559, + "args": { + "External id": 230628,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534764.236, "dur": 4.280, + "args": { + "External id": 230629,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115534769.623, "dur": 15.317, + "args": { + "External id": 230630,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115534790.556, "dur": 4.652, + "args": { + "External id": 230631,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534793.714, "dur": 1.362, + "args": { + "External id": 230632,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534802.500, "dur": 5.075, + "args": { + "External id": 230633,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534804.461, "dur": 3.011, + "args": { + "External id": 230634,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534810.248, "dur": 2.440, + "args": { + "External id": 230635,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534811.572, "dur": 1.035, + "args": { + "External id": 230636,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115534840.358, "dur": 16.776, + "args": { + "External id": 230637,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534872.198, "dur": 11.339, + "args": { + "External id": 230638,"Record function id": 0, "Ev Idx": 749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115534874.910, "dur": 7.909, + "args": { + "External id": 230639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115534876.731, "dur": 5.021, + "args": { + "External id": 230640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115534879.843, "dur": 1.822, + "args": { + "External id": 230641,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534893.961, "dur": 9.295, + "args": { + "External id": 230642,"Record function id": 0, "Sequence number": 2757878, "Fwd thread id": 1, "Ev Idx": 753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534895.557, "dur": 4.050, + "args": { + "External id": 230643,"Sequence number": 2757878, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 754 + } + }, + { + "ph": "f", "id": 78, "pid": 4183442, "tid": 31331, "ts": 667115534895.557, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115534897.370, "dur": 2.006, + "args": { + "External id": 230644,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115534898.111, "dur": 1.091, + "args": { + "External id": 230645,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534906.830, "dur": 136.283, + "args": { + "External id": 230646,"Record function id": 0, "Sequence number": 2757877, "Fwd thread id": 1, "Ev Idx": 757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115534907.990, "dur": 128.174, + "args": { + "External id": 230647,"Sequence number": 2757877, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 758 + } + }, + { + "ph": "f", "id": 79, "pid": 4183442, "tid": 31331, "ts": 667115534907.990, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534912.308, "dur": 6.519, + "args": { + "External id": 230648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534915.575, "dur": 2.674, + "args": { + "External id": 230649,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534917.409, "dur": 0.622, + "args": { + "External id": 230650,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115534920.089, "dur": 66.556, + "args": { + "External id": 230651,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534987.940, "dur": 6.026, + "args": { + "External id": 230652,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534988.504, "dur": 4.728, + "args": { + "External id": 230653,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534990.377, "dur": 2.661, + "args": { + "External id": 230654,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115534996.888, "dur": 3.365, + "args": { + "External id": 230655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115534998.026, "dur": 1.746, + "args": { + "External id": 230656,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115534999.215, "dur": 0.473, + "args": { + "External id": 230657,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115535000.954, "dur": 34.227, + "args": { + "External id": 230658,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535047.832, "dur": 9.501, + "args": { + "External id": 230659,"Record function id": 0, "Sequence number": 2757876, "Fwd thread id": 1, "Ev Idx": 770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535048.900, "dur": 5.932, + "args": { + "External id": 230660,"Sequence number": 2757876, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 771 + } + }, + { + "ph": "f", "id": 80, "pid": 4183442, "tid": 31331, "ts": 667115535048.900, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535050.879, "dur": 3.810, + "args": { + "External id": 230661,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535051.952, "dur": 2.572, + "args": { + "External id": 230662,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535060.750, "dur": 9.209, + "args": { + "External id": 230663,"Record function id": 0, "Sequence number": 2757875, "Fwd thread id": 1, "Ev Idx": 774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535063.760, "dur": 4.357, + "args": { + "External id": 230664,"Sequence number": 2757875, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 775 + } + }, + { + "ph": "f", "id": 81, "pid": 4183442, "tid": 31331, "ts": 667115535063.760, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115535064.530, "dur": 3.372, + "args": { + "External id": 230665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115535065.244, "dur": 2.202, + "args": { + "External id": 230666,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535066.928, "dur": 0.412, + "args": { + "External id": 230667,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115535073.970, "dur": 4.970, + "args": { + "External id": 230668,"Record function id": 0, "Ev Idx": 779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115535075.623, "dur": 2.772, + "args": { + "External id": 230669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115535076.717, "dur": 1.387, + "args": { + "External id": 230670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115535077.136, "dur": 0.872, + "args": { + "External id": 230671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535081.890, "dur": 8.377, + "args": { + "External id": 230672,"Record function id": 0, "Sequence number": 2757874, "Fwd thread id": 1, "Ev Idx": 783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535082.794, "dur": 5.503, + "args": { + "External id": 230673,"Sequence number": 2757874, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 784 + } + }, + { + "ph": "f", "id": 82, "pid": 4183442, "tid": 31331, "ts": 667115535082.794, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535086.317, "dur": 1.817, + "args": { + "External id": 230674,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535086.954, "dur": 1.080, + "args": { + "External id": 230675,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535094.813, "dur": 272.972, + "args": { + "External id": 230676,"Record function id": 0, "Sequence number": 2757873, "Fwd thread id": 1, "Ev Idx": 787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535096.340, "dur": 248.400, + "args": { + "External id": 230677,"Sequence number": 2757873, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 788 + } + }, + { + "ph": "f", "id": 83, "pid": 4183442, "tid": 31331, "ts": 667115535096.340, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115535112.400, "dur": 6.114, + "args": { + "External id": 230678,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535114.932, "dur": 3.124, + "args": { + "External id": 230679,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115535120.667, "dur": 4.135, + "args": { + "External id": 230680,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535122.210, "dur": 2.391, + "args": { + "External id": 230681,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115535126.636, "dur": 5.206, + "args": { + "External id": 230682,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535128.480, "dur": 3.157, + "args": { + "External id": 230683,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115535155.034, "dur": 165.719, + "args": { + "External id": 230684,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115535230.889, "dur": 3.629, + "args": { + "External id": 230685,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115535236.406, "dur": 3.481, + "args": { + "External id": 230686,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115535331.872, "dur": 3.221, + "args": { + "External id": 230687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115535338.539, "dur": 0.927, + "args": { + "External id": 230688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115535341.184, "dur": 0.725, + "args": { + "External id": 230689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535374.874, "dur": 238.069, + "args": { + "External id": 230690,"Record function id": 0, "Sequence number": 2757872, "Fwd thread id": 1, "Ev Idx": 801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535376.528, "dur": 226.450, + "args": { + "External id": 230691,"Sequence number": 2757872, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 802 + } + }, + { + "ph": "f", "id": 84, "pid": 4183442, "tid": 31331, "ts": 667115535376.528, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115535395.446, "dur": 42.728, + "args": { + "External id": 230692,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535398.513, "dur": 2.565, + "args": { + "External id": 230693,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115535402.376, "dur": 35.111, + "args": { + "External id": 230694,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115535447.385, "dur": 3.983, + "args": { + "External id": 230695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535448.972, "dur": 2.136, + "args": { + "External id": 230696,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535622.081, "dur": 195.307, + "args": { + "External id": 230697,"Record function id": 0, "Sequence number": 2757871, "Fwd thread id": 1, "Ev Idx": 808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115535624.289, "dur": 185.185, + "args": { + "External id": 230698,"Sequence number": 2757871, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 809 + } + }, + { + "ph": "f", "id": 85, "pid": 4183442, "tid": 31331, "ts": 667115535624.289, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115535636.533, "dur": 69.187, + "args": { + "External id": 230699,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535639.469, "dur": 3.545, + "args": { + "External id": 230700,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115535644.037, "dur": 60.578, + "args": { + "External id": 230701,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115535714.850, "dur": 5.607, + "args": { + "External id": 230702,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535716.859, "dur": 3.313, + "args": { + "External id": 230703,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535825.409, "dur": 18.272, + "args": { + "External id": 230704,"Record function id": 0, "Sequence number": 2757870, "Fwd thread id": 1, "Ev Idx": 815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535827.090, "dur": 12.635, + "args": { + "External id": 230705,"Sequence number": 2757870, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 816 + } + }, + { + "ph": "f", "id": 86, "pid": 4183442, "tid": 31331, "ts": 667115535827.090, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535829.311, "dur": 10.043, + "args": { + "External id": 230706,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535833.094, "dur": 6.027, + "args": { + "External id": 230707,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535847.541, "dur": 7.924, + "args": { + "External id": 230708,"Record function id": 0, "Sequence number": 2757869, "Fwd thread id": 1, "Ev Idx": 819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535848.539, "dur": 4.204, + "args": { + "External id": 230709,"Sequence number": 2757869, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 820 + } + }, + { + "ph": "f", "id": 87, "pid": 4183442, "tid": 31331, "ts": 667115535848.539, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535850.343, "dur": 2.239, + "args": { + "External id": 230710,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535851.674, "dur": 0.788, + "args": { + "External id": 230711,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535860.727, "dur": 7.184, + "args": { + "External id": 230712,"Record function id": 0, "Sequence number": 2757868, "Fwd thread id": 1, "Ev Idx": 823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535861.398, "dur": 4.364, + "args": { + "External id": 230713,"Sequence number": 2757868, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 824 + } + }, + { + "ph": "f", "id": 88, "pid": 4183442, "tid": 31331, "ts": 667115535861.398, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535863.361, "dur": 2.263, + "args": { + "External id": 230714,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535864.826, "dur": 0.664, + "args": { + "External id": 230715,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535871.865, "dur": 9.762, + "args": { + "External id": 230716,"Record function id": 0, "Sequence number": 2757867, "Fwd thread id": 1, "Ev Idx": 827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535873.549, "dur": 5.723, + "args": { + "External id": 230717,"Sequence number": 2757867, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 828 + } + }, + { + "ph": "f", "id": 89, "pid": 4183442, "tid": 31331, "ts": 667115535873.549, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115535875.129, "dur": 3.987, + "args": { + "External id": 230718,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115535878.121, "dur": 0.891, + "args": { + "External id": 230719,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535884.946, "dur": 155.771, + "args": { + "External id": 230720,"Record function id": 0, "Sequence number": 2757866, "Fwd thread id": 1, "Ev Idx": 831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115535885.855, "dur": 145.969, + "args": { + "External id": 230721,"Sequence number": 2757866, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 832 + } + }, + { + "ph": "f", "id": 90, "pid": 4183442, "tid": 31331, "ts": 667115535885.855, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115535890.167, "dur": 6.874, + "args": { + "External id": 230722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115535892.177, "dur": 4.217, + "args": { + "External id": 230723,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535894.637, "dur": 1.493, + "args": { + "External id": 230724,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115535900.190, "dur": 77.158, + "args": { + "External id": 230725,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115535978.753, "dur": 5.667, + "args": { + "External id": 230726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115535979.585, "dur": 3.661, + "args": { + "External id": 230727,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535981.816, "dur": 1.215, + "args": { + "External id": 230728,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115535986.333, "dur": 5.055, + "args": { + "External id": 230729,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115535987.531, "dur": 3.385, + "args": { + "External id": 230730,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115535990.435, "dur": 0.390, + "args": { + "External id": 230731,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115535992.322, "dur": 38.655, + "args": { + "External id": 230732,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536045.211, "dur": 8.144, + "args": { + "External id": 230733,"Record function id": 0, "Sequence number": 2757865, "Fwd thread id": 1, "Ev Idx": 844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536046.370, "dur": 4.539, + "args": { + "External id": 230734,"Sequence number": 2757865, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 845 + } + }, + { + "ph": "f", "id": 91, "pid": 4183442, "tid": 31331, "ts": 667115536046.370, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536048.158, "dur": 2.585, + "args": { + "External id": 230735,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536049.465, "dur": 1.141, + "args": { + "External id": 230736,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536056.809, "dur": 9.620, + "args": { + "External id": 230737,"Record function id": 0, "Sequence number": 2757864, "Fwd thread id": 1, "Ev Idx": 848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536058.000, "dur": 6.806, + "args": { + "External id": 230738,"Sequence number": 2757864, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 849 + } + }, + { + "ph": "f", "id": 92, "pid": 4183442, "tid": 31331, "ts": 667115536058.000, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536059.186, "dur": 5.434, + "args": { + "External id": 230739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536059.870, "dur": 4.250, + "args": { + "External id": 230740,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536063.511, "dur": 0.504, + "args": { + "External id": 230741,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536072.000, "dur": 9.466, + "args": { + "External id": 230742,"Record function id": 0, "Ev Idx": 853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536074.269, "dur": 6.538, + "args": { + "External id": 230743,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115536076.711, "dur": 3.691, + "args": { + "External id": 230744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115536077.773, "dur": 2.494, + "args": { + "External id": 230745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536084.902, "dur": 7.179, + "args": { + "External id": 230746,"Record function id": 0, "Sequence number": 2757863, "Fwd thread id": 1, "Ev Idx": 857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536086.301, "dur": 3.315, + "args": { + "External id": 230747,"Sequence number": 2757863, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 858 + } + }, + { + "ph": "f", "id": 93, "pid": 4183442, "tid": 31331, "ts": 667115536086.301, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536088.034, "dur": 1.441, + "args": { + "External id": 230748,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536088.612, "dur": 0.754, + "args": { + "External id": 230749,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536095.469, "dur": 96.161, + "args": { + "External id": 230750,"Record function id": 0, "Sequence number": 2757862, "Fwd thread id": 1, "Ev Idx": 861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536096.390, "dur": 89.313, + "args": { + "External id": 230751,"Sequence number": 2757862, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 862 + } + }, + { + "ph": "f", "id": 94, "pid": 4183442, "tid": 31331, "ts": 667115536096.390, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536101.562, "dur": 3.608, + "args": { + "External id": 230752,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536102.187, "dur": 2.501, + "args": { + "External id": 230753,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536104.072, "dur": 0.502, + "args": { + "External id": 230754,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115536106.280, "dur": 33.239, + "args": { + "External id": 230755,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536140.649, "dur": 3.812, + "args": { + "External id": 230756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536141.112, "dur": 2.748, + "args": { + "External id": 230757,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536142.670, "dur": 1.075, + "args": { + "External id": 230758,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536148.173, "dur": 5.309, + "args": { + "External id": 230759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536149.294, "dur": 3.744, + "args": { + "External id": 230760,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536150.772, "dur": 2.198, + "args": { + "External id": 230761,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115536154.290, "dur": 30.691, + "args": { + "External id": 230762,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536195.946, "dur": 32.558, + "args": { + "External id": 230763,"Record function id": 0, "Sequence number": 2757861, "Fwd thread id": 1, "Ev Idx": 874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536196.809, "dur": 4.510, + "args": { + "External id": 230764,"Sequence number": 2757861, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 875 + } + }, + { + "ph": "f", "id": 95, "pid": 4183442, "tid": 31331, "ts": 667115536196.809, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536198.819, "dur": 2.354, + "args": { + "External id": 230765,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536200.082, "dur": 0.980, + "args": { + "External id": 230766,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115536204.463, "dur": 19.971, + "args": { + "External id": 230767,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536232.399, "dur": 8.067, + "args": { + "External id": 230768,"Record function id": 0, "Sequence number": 2757860, "Fwd thread id": 1, "Ev Idx": 879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536233.578, "dur": 5.407, + "args": { + "External id": 230769,"Sequence number": 2757860, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 880 + } + }, + { + "ph": "f", "id": 96, "pid": 4183442, "tid": 31331, "ts": 667115536233.578, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536234.961, "dur": 3.840, + "args": { + "External id": 230770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536235.903, "dur": 2.376, + "args": { + "External id": 230771,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536237.639, "dur": 0.537, + "args": { + "External id": 230772,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536244.454, "dur": 7.553, + "args": { + "External id": 230773,"Record function id": 0, "Ev Idx": 884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536246.181, "dur": 5.333, + "args": { + "External id": 230774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115536247.581, "dur": 3.535, + "args": { + "External id": 230775,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115536250.025, "dur": 0.979, + "args": { + "External id": 230776,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536255.265, "dur": 7.189, + "args": { + "External id": 230777,"Record function id": 0, "Sequence number": 2757859, "Fwd thread id": 1, "Ev Idx": 888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536256.882, "dur": 3.284, + "args": { + "External id": 230778,"Sequence number": 2757859, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 889 + } + }, + { + "ph": "f", "id": 97, "pid": 4183442, "tid": 31331, "ts": 667115536256.882, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536258.320, "dur": 1.693, + "args": { + "External id": 230779,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536259.143, "dur": 0.738, + "args": { + "External id": 230780,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536267.252, "dur": 98.810, + "args": { + "External id": 230781,"Record function id": 0, "Sequence number": 2757858, "Fwd thread id": 1, "Ev Idx": 892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536267.972, "dur": 89.731, + "args": { + "External id": 230782,"Sequence number": 2757858, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 893 + } + }, + { + "ph": "f", "id": 98, "pid": 4183442, "tid": 31331, "ts": 667115536267.972, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536270.972, "dur": 4.708, + "args": { + "External id": 230783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536271.507, "dur": 3.703, + "args": { + "External id": 230784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536274.570, "dur": 0.517, + "args": { + "External id": 230785,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115536276.479, "dur": 36.034, + "args": { + "External id": 230786,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536313.511, "dur": 3.999, + "args": { + "External id": 230787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536314.179, "dur": 2.779, + "args": { + "External id": 230788,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536315.888, "dur": 0.959, + "args": { + "External id": 230789,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536318.749, "dur": 7.664, + "args": { + "External id": 230790,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536323.458, "dur": 2.122, + "args": { + "External id": 230791,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536325.142, "dur": 0.370, + "args": { + "External id": 230792,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115536326.857, "dur": 30.198, + "args": { + "External id": 230793,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536370.372, "dur": 25.314, + "args": { + "External id": 230794,"Record function id": 0, "Sequence number": 2757857, "Fwd thread id": 1, "Ev Idx": 905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536371.300, "dur": 4.254, + "args": { + "External id": 230795,"Sequence number": 2757857, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 906 + } + }, + { + "ph": "f", "id": 99, "pid": 4183442, "tid": 31331, "ts": 667115536371.300, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536373.276, "dur": 2.125, + "args": { + "External id": 230796,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536374.243, "dur": 1.063, + "args": { + "External id": 230797,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115536377.845, "dur": 15.867, + "args": { + "External id": 230798,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536399.211, "dur": 10.200, + "args": { + "External id": 230799,"Record function id": 0, "Sequence number": 2757856, "Fwd thread id": 1, "Ev Idx": 910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536401.912, "dur": 5.270, + "args": { + "External id": 230800,"Sequence number": 2757856, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 911 + } + }, + { + "ph": "f", "id": 100, "pid": 4183442, "tid": 31331, "ts": 667115536401.912, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536403.280, "dur": 3.726, + "args": { + "External id": 230801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536404.051, "dur": 2.409, + "args": { + "External id": 230802,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536405.875, "dur": 0.443, + "args": { + "External id": 230803,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536413.319, "dur": 5.189, + "args": { + "External id": 230804,"Record function id": 0, "Ev Idx": 915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536414.833, "dur": 3.180, + "args": { + "External id": 230805,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115536415.964, "dur": 1.768, + "args": { + "External id": 230806,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115536416.554, "dur": 1.054, + "args": { + "External id": 230807,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115536423.191, "dur": 421.119, + "args": { + "External id": 230808,"Record function id": 0, "Sequence number": 2757855, "Fwd thread id": 1, "Ev Idx": 919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115536424.646, "dur": 384.442, + "args": { + "External id": 230809,"Sequence number": 2757855, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 920 + } + }, + { + "ph": "f", "id": 101, "pid": 4183442, "tid": 31331, "ts": 667115536424.646, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536453.665, "dur": 3.721, + "args": { + "External id": 230810,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536455.982, "dur": 1.249, + "args": { + "External id": 230811,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115536470.832, "dur": 5.023, + "args": { + "External id": 230812,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115536484.708, "dur": 2.851, + "args": { + "External id": 230813,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536649.121, "dur": 40.050, + "args": { + "External id": 230814,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115536695.345, "dur": 42.993, + "args": { + "External id": 230815,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536708.379, "dur": 0.952, + "args": { + "External id": 230816,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115536749.211, "dur": 34.885, + "args": { + "External id": 230817,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115536750.957, "dur": 32.932, + "args": { + "External id": 230818,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536757.495, "dur": 5.319, + "args": { + "External id": 230819,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115536764.550, "dur": 18.796, + "args": { + "External id": 230820,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115536788.715, "dur": 2.525, + "args": { + "External id": 230821,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536790.020, "dur": 1.113, + "args": { + "External id": 230822,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536798.021, "dur": 2.443, + "args": { + "External id": 230823,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115536799.323, "dur": 1.043, + "args": { + "External id": 230824,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115536823.258, "dur": 16.622, + "args": { + "External id": 230825,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536857.503, "dur": 8.613, + "args": { + "External id": 230826,"Record function id": 0, "Ev Idx": 937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115536859.823, "dur": 5.601, + "args": { + "External id": 230827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115536861.945, "dur": 2.560, + "args": { + "External id": 230828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115536862.736, "dur": 1.680, + "args": { + "External id": 230829,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536870.004, "dur": 6.758, + "args": { + "External id": 230830,"Record function id": 0, "Sequence number": 2757854, "Fwd thread id": 1, "Ev Idx": 941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115536871.048, "dur": 1.564, + "args": { + "External id": 230831,"Sequence number": 2757854, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 942 + } + }, + { + "ph": "f", "id": 102, "pid": 4183442, "tid": 31331, "ts": 667115536871.048, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115536881.129, "dur": 396.912, + "args": { + "External id": 230832,"Record function id": 0, "Sequence number": 2757853, "Fwd thread id": 1, "Ev Idx": 943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115536882.481, "dur": 381.223, + "args": { + "External id": 230833,"Sequence number": 2757853, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 944 + } + }, + { + "ph": "f", "id": 103, "pid": 4183442, "tid": 31331, "ts": 667115536882.481, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115536914.260, "dur": 8.878, + "args": { + "External id": 230834,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115536919.847, "dur": 2.974, + "args": { + "External id": 230835,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536926.292, "dur": 5.884, + "args": { + "External id": 230836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536927.736, "dur": 3.655, + "args": { + "External id": 230837,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536930.340, "dur": 0.859, + "args": { + "External id": 230838,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 31331, + "ts": 667115536935.465, "dur": 90.826, + "args": { + "External id": 230839,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115536936.637, "dur": 6.670, + "args": { + "External id": 230840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115536939.023, "dur": 3.750, + "args": { + "External id": 230841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115536940.642, "dur": 2.022, + "args": { + "External id": 230842,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 31331, + "ts": 667115536944.463, "dur": 81.213, + "args": { + "External id": 230843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115536945.980, "dur": 78.639, + "args": { + "External id": 230844,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115537029.960, "dur": 2.574, + "args": { + "External id": 230845,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537030.973, "dur": 1.407, + "args": { + "External id": 230846,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537064.345, "dur": 4.642, + "args": { + "External id": 230847,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537070.299, "dur": 2.046, + "args": { + "External id": 230848,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537073.529, "dur": 2.005, + "args": { + "External id": 230849,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537107.243, "dur": 2.201, + "args": { + "External id": 230850,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537108.275, "dur": 0.998, + "args": { + "External id": 230851,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183442, "tid": 31331, + "ts": 667115537131.503, "dur": 113.412, + "args": { + "External id": 230852,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115537136.465, "dur": 4.973, + "args": { + "External id": 230853,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537139.908, "dur": 0.677, + "args": { + "External id": 230854,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115537143.557, "dur": 7.908, + "args": { + "External id": 230855,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537148.740, "dur": 1.966, + "args": { + "External id": 230856,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115537152.662, "dur": 2.400, + "args": { + "External id": 230857,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537154.327, "dur": 0.372, + "args": { + "External id": 230858,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115537155.839, "dur": 3.396, + "args": { + "External id": 230859,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537157.818, "dur": 0.566, + "args": { + "External id": 230860,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115537162.785, "dur": 3.068, + "args": { + "External id": 230861,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537164.759, "dur": 0.781, + "args": { + "External id": 230862,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537166.959, "dur": 5.614, + "args": { + "External id": 230863,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115537170.748, "dur": 1.670, + "args": { + "External id": 230864,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115537173.584, "dur": 2.458, + "args": { + "External id": 230865,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537175.307, "dur": 0.366, + "args": { + "External id": 230866,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537178.835, "dur": 4.236, + "args": { + "External id": 230867,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537179.966, "dur": 3.016, + "args": { + "External id": 230868,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115537184.344, "dur": 46.137, + "args": { + "External id": 230869,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537232.563, "dur": 2.954, + "args": { + "External id": 230870,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115537236.429, "dur": 4.166, + "args": { + "External id": 230871,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537239.177, "dur": 0.713, + "args": { + "External id": 230872,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537242.953, "dur": 0.828, + "args": { + "External id": 230873,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537287.146, "dur": 8.168, + "args": { + "External id": 230874,"Record function id": 0, "Ev Idx": 985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537289.481, "dur": 5.095, + "args": { + "External id": 230875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115537291.278, "dur": 2.516, + "args": { + "External id": 230876,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115537292.066, "dur": 1.630, + "args": { + "External id": 230877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537299.552, "dur": 7.653, + "args": { + "External id": 230878,"Record function id": 0, "Sequence number": 2757852, "Fwd thread id": 1, "Ev Idx": 989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537301.166, "dur": 3.251, + "args": { + "External id": 230879,"Sequence number": 2757852, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 990 + } + }, + { + "ph": "f", "id": 104, "pid": 4183442, "tid": 31331, "ts": 667115537301.166, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537302.534, "dur": 1.715, + "args": { + "External id": 230880,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537303.190, "dur": 0.929, + "args": { + "External id": 230881,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537311.158, "dur": 105.491, + "args": { + "External id": 230882,"Record function id": 0, "Sequence number": 2757851, "Fwd thread id": 1, "Ev Idx": 993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537311.973, "dur": 97.556, + "args": { + "External id": 230883,"Sequence number": 2757851, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 994 + } + }, + { + "ph": "f", "id": 105, "pid": 4183442, "tid": 31331, "ts": 667115537311.973, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537315.298, "dur": 5.649, + "args": { + "External id": 230884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537316.244, "dur": 4.196, + "args": { + "External id": 230885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537319.581, "dur": 0.715, + "args": { + "External id": 230886,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115537322.145, "dur": 33.530, + "args": { + "External id": 230887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537356.926, "dur": 4.581, + "args": { + "External id": 230888,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537357.566, "dur": 3.043, + "args": { + "External id": 230889,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537359.302, "dur": 1.147, + "args": { + "External id": 230890,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537363.154, "dur": 5.313, + "args": { + "External id": 230891,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537365.951, "dur": 2.051, + "args": { + "External id": 230892,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537367.596, "dur": 0.338, + "args": { + "External id": 230893,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115537369.196, "dur": 39.367, + "args": { + "External id": 230894,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537421.172, "dur": 6.847, + "args": { + "External id": 230895,"Record function id": 0, "Sequence number": 2757850, "Fwd thread id": 1, "Ev Idx": 1006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537422.449, "dur": 4.089, + "args": { + "External id": 230896,"Sequence number": 2757850, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1007 + } + }, + { + "ph": "f", "id": 106, "pid": 4183442, "tid": 31331, "ts": 667115537422.449, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537424.186, "dur": 2.197, + "args": { + "External id": 230897,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537425.178, "dur": 1.071, + "args": { + "External id": 230898,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537431.612, "dur": 9.700, + "args": { + "External id": 230899,"Record function id": 0, "Sequence number": 2757849, "Fwd thread id": 1, "Ev Idx": 1010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537432.655, "dur": 5.854, + "args": { + "External id": 230900,"Sequence number": 2757849, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1011 + } + }, + { + "ph": "f", "id": 107, "pid": 4183442, "tid": 31331, "ts": 667115537432.655, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537433.784, "dur": 4.512, + "args": { + "External id": 230901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537435.967, "dur": 1.822, + "args": { + "External id": 230902,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537437.286, "dur": 0.408, + "args": { + "External id": 230903,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537445.325, "dur": 5.613, + "args": { + "External id": 230904,"Record function id": 0, "Ev Idx": 1015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537447.024, "dur": 3.396, + "args": { + "External id": 230905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115537448.355, "dur": 1.541, + "args": { + "External id": 230906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115537448.778, "dur": 1.020, + "args": { + "External id": 230907,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537456.478, "dur": 7.371, + "args": { + "External id": 230908,"Record function id": 0, "Sequence number": 2757848, "Fwd thread id": 1, "Ev Idx": 1019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537457.666, "dur": 3.352, + "args": { + "External id": 230909,"Sequence number": 2757848, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1020 + } + }, + { + "ph": "f", "id": 108, "pid": 4183442, "tid": 31331, "ts": 667115537457.666, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537459.045, "dur": 1.824, + "args": { + "External id": 230910,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537459.937, "dur": 0.783, + "args": { + "External id": 230911,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537468.842, "dur": 143.958, + "args": { + "External id": 230912,"Record function id": 0, "Sequence number": 2757847, "Fwd thread id": 1, "Ev Idx": 1023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537488.116, "dur": 113.925, + "args": { + "External id": 230913,"Sequence number": 2757847, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1024 + } + }, + { + "ph": "f", "id": 109, "pid": 4183442, "tid": 31331, "ts": 667115537488.116, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537511.997, "dur": 4.569, + "args": { + "External id": 230914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537512.922, "dur": 2.907, + "args": { + "External id": 230915,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537514.911, "dur": 0.629, + "args": { + "External id": 230916,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115537517.385, "dur": 33.919, + "args": { + "External id": 230917,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537554.541, "dur": 4.976, + "args": { + "External id": 230918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537555.107, "dur": 3.772, + "args": { + "External id": 230919,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537556.928, "dur": 1.788, + "args": { + "External id": 230920,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537561.209, "dur": 4.617, + "args": { + "External id": 230921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537562.005, "dur": 3.130, + "args": { + "External id": 230922,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537563.073, "dur": 1.998, + "args": { + "External id": 230923,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115537568.215, "dur": 33.084, + "args": { + "External id": 230924,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537619.392, "dur": 30.967, + "args": { + "External id": 230925,"Record function id": 0, "Sequence number": 2757846, "Fwd thread id": 1, "Ev Idx": 1036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537620.417, "dur": 4.382, + "args": { + "External id": 230926,"Sequence number": 2757846, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1037 + } + }, + { + "ph": "f", "id": 110, "pid": 4183442, "tid": 31331, "ts": 667115537620.417, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537622.165, "dur": 2.485, + "args": { + "External id": 230927,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537623.079, "dur": 1.443, + "args": { + "External id": 230928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115537627.744, "dur": 19.501, + "args": { + "External id": 230929,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537654.049, "dur": 46.995, + "args": { + "External id": 230930,"Record function id": 0, "Sequence number": 2757845, "Fwd thread id": 1, "Ev Idx": 1041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115537690.017, "dur": 8.115, + "args": { + "External id": 230931,"Sequence number": 2757845, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1042 + } + }, + { + "ph": "f", "id": 111, "pid": 4183442, "tid": 31331, "ts": 667115537690.017, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115537691.536, "dur": 6.374, + "args": { + "External id": 230932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115537692.663, "dur": 4.442, + "args": { + "External id": 230933,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537696.156, "dur": 0.680, + "args": { + "External id": 230934,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537706.970, "dur": 6.078, + "args": { + "External id": 230935,"Record function id": 0, "Ev Idx": 1046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115537708.713, "dur": 3.745, + "args": { + "External id": 230936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115537709.939, "dur": 2.028, + "args": { + "External id": 230937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115537710.456, "dur": 1.421, + "args": { + "External id": 230938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115537717.540, "dur": 398.188, + "args": { + "External id": 230939,"Record function id": 0, "Sequence number": 2757844, "Fwd thread id": 1, "Ev Idx": 1050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115537719.226, "dur": 365.970, + "args": { + "External id": 230940,"Sequence number": 2757844, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 1051 + } + }, + { + "ph": "f", "id": 112, "pid": 4183442, "tid": 31331, "ts": 667115537719.226, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 31331, + "ts": 667115537743.354, "dur": 36.713, + "args": { + "External id": 230941,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115537744.949, "dur": 34.872, + "args": { + "External id": 230942,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115537747.570, "dur": 6.862, + "args": { + "External id": 230943,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 1054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537750.484, "dur": 3.482, + "args": { + "External id": 230944,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115537755.862, "dur": 23.320, + "args": { + "External id": 230945,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537791.894, "dur": 2.437, + "args": { + "External id": 230946,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537792.777, "dur": 1.400, + "args": { + "External id": 230947,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115537799.989, "dur": 3.089, + "args": { + "External id": 230948,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537800.563, "dur": 2.382, + "args": { + "External id": 230949,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537814.251, "dur": 2.415, + "args": { + "External id": 230950,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115537828.040, "dur": 3.014, + "args": { + "External id": 230951,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115537984.623, "dur": 2.163, + "args": { + "External id": 230952,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115537990.881, "dur": 29.531, + "args": { + "External id": 230953,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115537999.179, "dur": 0.886, + "args": { + "External id": 230954,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115538025.872, "dur": 25.632, + "args": { + "External id": 230955,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115538027.527, "dur": 23.767, + "args": { + "External id": 230956,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538031.678, "dur": 3.778, + "args": { + "External id": 230957,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115538036.843, "dur": 13.942, + "args": { + "External id": 230958,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115538056.051, "dur": 2.761, + "args": { + "External id": 230959,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538057.470, "dur": 1.201, + "args": { + "External id": 230960,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115538067.274, "dur": 2.287, + "args": { + "External id": 230961,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538068.331, "dur": 1.108, + "args": { + "External id": 230962,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115538072.076, "dur": 4.347, + "args": { + "External id": 230963,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538073.074, "dur": 3.258, + "args": { + "External id": 230964,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115538098.469, "dur": 15.801, + "args": { + "External id": 230965,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115538125.547, "dur": 9.730, + "args": { + "External id": 230966,"Record function id": 0, "Ev Idx": 1077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115538127.710, "dur": 6.909, + "args": { + "External id": 230967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115538129.273, "dur": 4.506, + "args": { + "External id": 230968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115538132.038, "dur": 1.614, + "args": { + "External id": 230969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538139.135, "dur": 8.626, + "args": { + "External id": 230970,"Record function id": 0, "Sequence number": 2757843, "Fwd thread id": 1, "Ev Idx": 1081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538140.798, "dur": 3.971, + "args": { + "External id": 230971,"Sequence number": 2757843, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1082 + } + }, + { + "ph": "f", "id": 113, "pid": 4183442, "tid": 31331, "ts": 667115538140.798, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115538142.262, "dur": 2.314, + "args": { + "External id": 230972,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538143.238, "dur": 1.188, + "args": { + "External id": 230973,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538151.272, "dur": 136.976, + "args": { + "External id": 230974,"Record function id": 0, "Sequence number": 2757842, "Fwd thread id": 1, "Ev Idx": 1085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538152.336, "dur": 128.325, + "args": { + "External id": 230975,"Sequence number": 2757842, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1086 + } + }, + { + "ph": "f", "id": 114, "pid": 4183442, "tid": 31331, "ts": 667115538152.336, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115538157.098, "dur": 5.771, + "args": { + "External id": 230976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115538158.110, "dur": 4.204, + "args": { + "External id": 230977,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538161.312, "dur": 0.846, + "args": { + "External id": 230978,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115538164.049, "dur": 66.120, + "args": { + "External id": 230979,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115538231.497, "dur": 5.925, + "args": { + "External id": 230980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115538232.224, "dur": 4.473, + "args": { + "External id": 230981,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538234.091, "dur": 2.446, + "args": { + "External id": 230982,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115538239.061, "dur": 4.741, + "args": { + "External id": 230983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115538241.787, "dur": 1.532, + "args": { + "External id": 230984,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538242.933, "dur": 0.317, + "args": { + "External id": 230985,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115538244.713, "dur": 34.980, + "args": { + "External id": 230986,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538293.083, "dur": 10.293, + "args": { + "External id": 230987,"Record function id": 0, "Sequence number": 2757841, "Fwd thread id": 1, "Ev Idx": 1098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538294.485, "dur": 6.609, + "args": { + "External id": 230988,"Sequence number": 2757841, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1099 + } + }, + { + "ph": "f", "id": 115, "pid": 4183442, "tid": 31331, "ts": 667115538294.485, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115538296.697, "dur": 4.230, + "args": { + "External id": 230989,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538297.689, "dur": 3.083, + "args": { + "External id": 230990,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538306.516, "dur": 9.036, + "args": { + "External id": 230991,"Record function id": 0, "Sequence number": 2757840, "Fwd thread id": 1, "Ev Idx": 1102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538308.039, "dur": 5.786, + "args": { + "External id": 230992,"Sequence number": 2757840, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1103 + } + }, + { + "ph": "f", "id": 116, "pid": 4183442, "tid": 31331, "ts": 667115538308.039, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115538308.877, "dur": 4.738, + "args": { + "External id": 230993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115538311.206, "dur": 1.882, + "args": { + "External id": 230994,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538312.670, "dur": 0.308, + "args": { + "External id": 230995,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115538319.479, "dur": 5.212, + "args": { + "External id": 230996,"Record function id": 0, "Ev Idx": 1107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115538321.178, "dur": 3.017, + "args": { + "External id": 230997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115538322.243, "dur": 1.568, + "args": { + "External id": 230998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115538322.671, "dur": 1.027, + "args": { + "External id": 230999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538329.577, "dur": 7.318, + "args": { + "External id": 231000,"Record function id": 0, "Sequence number": 2757839, "Fwd thread id": 1, "Ev Idx": 1111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115538330.424, "dur": 3.734, + "args": { + "External id": 231001,"Sequence number": 2757839, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1112 + } + }, + { + "ph": "f", "id": 117, "pid": 4183442, "tid": 31331, "ts": 667115538330.424, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115538331.851, "dur": 2.153, + "args": { + "External id": 231002,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115538332.557, "dur": 1.311, + "args": { + "External id": 231003,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538341.717, "dur": 389.139, + "args": { + "External id": 231004,"Record function id": 0, "Sequence number": 2757838, "Fwd thread id": 1, "Ev Idx": 1115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538343.337, "dur": 363.409, + "args": { + "External id": 231005,"Sequence number": 2757838, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1116 + } + }, + { + "ph": "f", "id": 118, "pid": 4183442, "tid": 31331, "ts": 667115538343.337, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115538358.101, "dur": 6.548, + "args": { + "External id": 231006,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538361.076, "dur": 3.206, + "args": { + "External id": 231007,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115538367.100, "dur": 4.301, + "args": { + "External id": 231008,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538368.676, "dur": 2.539, + "args": { + "External id": 231009,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115538382.188, "dur": 5.729, + "args": { + "External id": 231010,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538385.621, "dur": 2.083, + "args": { + "External id": 231011,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115538414.058, "dur": 229.285, + "args": { + "External id": 231012,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115538486.197, "dur": 26.050, + "args": { + "External id": 231013,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115538515.361, "dur": 4.955, + "args": { + "External id": 231014,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115538690.681, "dur": 4.560, + "args": { + "External id": 231015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115538700.366, "dur": 0.775, + "args": { + "External id": 231016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115538703.141, "dur": 0.703, + "args": { + "External id": 231017,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538741.999, "dur": 224.338, + "args": { + "External id": 231018,"Record function id": 0, "Sequence number": 2757837, "Fwd thread id": 1, "Ev Idx": 1129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538744.143, "dur": 214.999, + "args": { + "External id": 231019,"Sequence number": 2757837, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1130 + } + }, + { + "ph": "f", "id": 119, "pid": 4183442, "tid": 31331, "ts": 667115538744.143, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115538764.981, "dur": 46.108, + "args": { + "External id": 231020,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538768.516, "dur": 3.721, + "args": { + "External id": 231021,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115538773.770, "dur": 36.708, + "args": { + "External id": 231022,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115538821.042, "dur": 5.743, + "args": { + "External id": 231023,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538823.348, "dur": 3.123, + "args": { + "External id": 231024,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538973.337, "dur": 144.065, + "args": { + "External id": 231025,"Record function id": 0, "Sequence number": 2757836, "Fwd thread id": 1, "Ev Idx": 1136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115538975.295, "dur": 134.891, + "args": { + "External id": 231026,"Sequence number": 2757836, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1137 + } + }, + { + "ph": "f", "id": 120, "pid": 4183442, "tid": 31331, "ts": 667115538975.295, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115538986.796, "dur": 33.059, + "args": { + "External id": 231027,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115538989.620, "dur": 2.527, + "args": { + "External id": 231028,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115538996.727, "dur": 22.654, + "args": { + "External id": 231029,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115539027.199, "dur": 4.748, + "args": { + "External id": 231030,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539029.451, "dur": 2.254, + "args": { + "External id": 231031,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539123.388, "dur": 15.282, + "args": { + "External id": 231032,"Record function id": 0, "Sequence number": 2757835, "Fwd thread id": 1, "Ev Idx": 1143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539124.773, "dur": 10.934, + "args": { + "External id": 231033,"Sequence number": 2757835, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1144 + } + }, + { + "ph": "f", "id": 121, "pid": 4183442, "tid": 31331, "ts": 667115539124.773, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539127.063, "dur": 8.331, + "args": { + "External id": 231034,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539128.749, "dur": 6.454, + "args": { + "External id": 231035,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539141.868, "dur": 8.869, + "args": { + "External id": 231036,"Record function id": 0, "Sequence number": 2757834, "Fwd thread id": 1, "Ev Idx": 1147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539144.351, "dur": 4.146, + "args": { + "External id": 231037,"Sequence number": 2757834, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1148 + } + }, + { + "ph": "f", "id": 122, "pid": 4183442, "tid": 31331, "ts": 667115539144.351, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539146.386, "dur": 1.957, + "args": { + "External id": 231038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539147.283, "dur": 0.941, + "args": { + "External id": 231039,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539153.903, "dur": 6.433, + "args": { + "External id": 231040,"Record function id": 0, "Sequence number": 2757833, "Fwd thread id": 1, "Ev Idx": 1151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539155.025, "dur": 3.008, + "args": { + "External id": 231041,"Sequence number": 2757833, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1152 + } + }, + { + "ph": "f", "id": 123, "pid": 4183442, "tid": 31331, "ts": 667115539155.025, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539156.376, "dur": 1.509, + "args": { + "External id": 231042,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539157.076, "dur": 0.682, + "args": { + "External id": 231043,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539163.604, "dur": 9.215, + "args": { + "External id": 231044,"Record function id": 0, "Sequence number": 2757832, "Fwd thread id": 1, "Ev Idx": 1155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539164.983, "dur": 5.321, + "args": { + "External id": 231045,"Sequence number": 2757832, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1156 + } + }, + { + "ph": "f", "id": 124, "pid": 4183442, "tid": 31331, "ts": 667115539164.983, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539166.380, "dur": 3.765, + "args": { + "External id": 231046,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539168.872, "dur": 1.182, + "args": { + "External id": 231047,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539176.272, "dur": 154.120, + "args": { + "External id": 231048,"Record function id": 0, "Sequence number": 2757831, "Fwd thread id": 1, "Ev Idx": 1159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539177.426, "dur": 144.589, + "args": { + "External id": 231049,"Sequence number": 2757831, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1160 + } + }, + { + "ph": "f", "id": 125, "pid": 4183442, "tid": 31331, "ts": 667115539177.426, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539182.013, "dur": 7.180, + "args": { + "External id": 231050,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539184.101, "dur": 4.473, + "args": { + "External id": 231051,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539186.616, "dur": 1.711, + "args": { + "External id": 231052,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539190.734, "dur": 74.619, + "args": { + "External id": 231053,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539268.754, "dur": 5.248, + "args": { + "External id": 231054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539269.486, "dur": 3.727, + "args": { + "External id": 231055,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539271.641, "dur": 1.430, + "args": { + "External id": 231056,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539275.920, "dur": 3.927, + "args": { + "External id": 231057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539277.020, "dur": 2.206, + "args": { + "External id": 231058,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539278.596, "dur": 0.563, + "args": { + "External id": 231059,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539282.658, "dur": 38.540, + "args": { + "External id": 231060,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539337.622, "dur": 7.807, + "args": { + "External id": 231061,"Record function id": 0, "Sequence number": 2757830, "Fwd thread id": 1, "Ev Idx": 1172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539338.687, "dur": 4.744, + "args": { + "External id": 231062,"Sequence number": 2757830, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1173 + } + }, + { + "ph": "f", "id": 126, "pid": 4183442, "tid": 31331, "ts": 667115539338.687, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539340.591, "dur": 2.673, + "args": { + "External id": 231063,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539341.949, "dur": 1.163, + "args": { + "External id": 231064,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539348.829, "dur": 9.211, + "args": { + "External id": 231065,"Record function id": 0, "Sequence number": 2757829, "Fwd thread id": 1, "Ev Idx": 1176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539349.695, "dur": 6.653, + "args": { + "External id": 231066,"Sequence number": 2757829, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1177 + } + }, + { + "ph": "f", "id": 127, "pid": 4183442, "tid": 31331, "ts": 667115539349.695, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539350.904, "dur": 5.243, + "args": { + "External id": 231067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539351.650, "dur": 3.990, + "args": { + "External id": 231068,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539354.984, "dur": 0.553, + "args": { + "External id": 231069,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539363.508, "dur": 9.244, + "args": { + "External id": 231070,"Record function id": 0, "Ev Idx": 1181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539365.510, "dur": 6.560, + "args": { + "External id": 231071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115539368.058, "dur": 3.615, + "args": { + "External id": 231072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115539369.168, "dur": 2.405, + "args": { + "External id": 231073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539376.602, "dur": 7.032, + "args": { + "External id": 231074,"Record function id": 0, "Sequence number": 2757828, "Fwd thread id": 1, "Ev Idx": 1185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539378.105, "dur": 3.067, + "args": { + "External id": 231075,"Sequence number": 2757828, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1186 + } + }, + { + "ph": "f", "id": 128, "pid": 4183442, "tid": 31331, "ts": 667115539378.105, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539379.452, "dur": 1.562, + "args": { + "External id": 231076,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539380.052, "dur": 0.825, + "args": { + "External id": 231077,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539386.929, "dur": 94.914, + "args": { + "External id": 231078,"Record function id": 0, "Sequence number": 2757827, "Fwd thread id": 1, "Ev Idx": 1189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539387.702, "dur": 88.432, + "args": { + "External id": 231079,"Sequence number": 2757827, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1190 + } + }, + { + "ph": "f", "id": 129, "pid": 4183442, "tid": 31331, "ts": 667115539387.702, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539391.962, "dur": 2.855, + "args": { + "External id": 231080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539392.469, "dur": 1.894, + "args": { + "External id": 231081,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539393.772, "dur": 0.482, + "args": { + "External id": 231082,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539395.540, "dur": 33.808, + "args": { + "External id": 231083,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539430.545, "dur": 3.793, + "args": { + "External id": 231084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539430.969, "dur": 2.724, + "args": { + "External id": 231085,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539432.918, "dur": 0.648, + "args": { + "External id": 231086,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539437.928, "dur": 5.456, + "args": { + "External id": 231087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539438.975, "dur": 3.924, + "args": { + "External id": 231088,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539440.680, "dur": 2.140, + "args": { + "External id": 231089,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539443.859, "dur": 31.512, + "args": { + "External id": 231090,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539486.160, "dur": 58.839, + "args": { + "External id": 231091,"Record function id": 0, "Sequence number": 2757826, "Fwd thread id": 1, "Ev Idx": 1202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539487.174, "dur": 27.241, + "args": { + "External id": 231092,"Sequence number": 2757826, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1203 + } + }, + { + "ph": "f", "id": 130, "pid": 4183442, "tid": 31331, "ts": 667115539487.174, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539489.085, "dur": 25.125, + "args": { + "External id": 231093,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539511.705, "dur": 2.169, + "args": { + "External id": 231094,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115539518.555, "dur": 23.437, + "args": { + "External id": 231095,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539550.506, "dur": 7.887, + "args": { + "External id": 231096,"Record function id": 0, "Sequence number": 2757825, "Fwd thread id": 1, "Ev Idx": 1207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539551.573, "dur": 5.193, + "args": { + "External id": 231097,"Sequence number": 2757825, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1208 + } + }, + { + "ph": "f", "id": 131, "pid": 4183442, "tid": 31331, "ts": 667115539551.573, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539552.232, "dur": 4.342, + "args": { + "External id": 231098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539553.464, "dur": 2.565, + "args": { + "External id": 231099,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539555.136, "dur": 0.800, + "args": { + "External id": 231100,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539562.849, "dur": 13.255, + "args": { + "External id": 231101,"Record function id": 0, "Ev Idx": 1212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539564.620, "dur": 10.850, + "args": { + "External id": 231102,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115539570.767, "dur": 4.273, + "args": { + "External id": 231103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115539573.300, "dur": 1.639, + "args": { + "External id": 231104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539579.377, "dur": 9.100, + "args": { + "External id": 231105,"Record function id": 0, "Sequence number": 2757824, "Fwd thread id": 1, "Ev Idx": 1216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539581.123, "dur": 5.357, + "args": { + "External id": 231106,"Sequence number": 2757824, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1217 + } + }, + { + "ph": "f", "id": 132, "pid": 4183442, "tid": 31331, "ts": 667115539581.123, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539582.307, "dur": 4.025, + "args": { + "External id": 231107,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539585.183, "dur": 0.986, + "args": { + "External id": 231108,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539591.433, "dur": 150.353, + "args": { + "External id": 231109,"Record function id": 0, "Sequence number": 2757823, "Fwd thread id": 1, "Ev Idx": 1220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539592.744, "dur": 138.586, + "args": { + "External id": 231110,"Sequence number": 2757823, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1221 + } + }, + { + "ph": "f", "id": 133, "pid": 4183442, "tid": 31331, "ts": 667115539592.744, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539597.644, "dur": 3.215, + "args": { + "External id": 231111,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539598.483, "dur": 1.919, + "args": { + "External id": 231112,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539599.881, "dur": 0.406, + "args": { + "External id": 231113,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539601.470, "dur": 39.379, + "args": { + "External id": 231114,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539642.067, "dur": 6.948, + "args": { + "External id": 231115,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539642.700, "dur": 5.529, + "args": { + "External id": 231116,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539645.856, "dur": 2.217, + "args": { + "External id": 231117,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539650.500, "dur": 38.677, + "args": { + "External id": 231118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539651.759, "dur": 36.502, + "args": { + "External id": 231119,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539653.075, "dur": 34.460, + "args": { + "External id": 231120,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115539690.573, "dur": 39.693, + "args": { + "External id": 231121,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539748.086, "dur": 30.511, + "args": { + "External id": 231122,"Record function id": 0, "Sequence number": 2757822, "Fwd thread id": 1, "Ev Idx": 1233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539749.251, "dur": 6.612, + "args": { + "External id": 231123,"Sequence number": 2757822, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1234 + } + }, + { + "ph": "f", "id": 134, "pid": 4183442, "tid": 31331, "ts": 667115539749.251, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539751.245, "dur": 4.479, + "args": { + "External id": 231124,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539754.318, "dur": 1.257, + "args": { + "External id": 231125,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115539758.365, "dur": 17.852, + "args": { + "External id": 231126,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539781.934, "dur": 8.174, + "args": { + "External id": 231127,"Record function id": 0, "Sequence number": 2757821, "Fwd thread id": 1, "Ev Idx": 1238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115539783.026, "dur": 4.688, + "args": { + "External id": 231128,"Sequence number": 2757821, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1239 + } + }, + { + "ph": "f", "id": 135, "pid": 4183442, "tid": 31331, "ts": 667115539783.026, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115539783.833, "dur": 3.681, + "args": { + "External id": 231129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115539784.670, "dur": 2.287, + "args": { + "External id": 231130,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115539786.210, "dur": 0.653, + "args": { + "External id": 231131,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539794.237, "dur": 6.482, + "args": { + "External id": 231132,"Record function id": 0, "Ev Idx": 1243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115539796.232, "dur": 3.926, + "args": { + "External id": 231133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115539797.241, "dur": 2.573, + "args": { + "External id": 231134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115539797.904, "dur": 1.801, + "args": { + "External id": 231135,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115539807.216, "dur": 348.454, + "args": { + "External id": 231136,"Record function id": 0, "Sequence number": 2757820, "Fwd thread id": 1, "Ev Idx": 1247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115539808.797, "dur": 318.054, + "args": { + "External id": 231137,"Sequence number": 2757820, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1248 + } + }, + { + "ph": "f", "id": 136, "pid": 4183442, "tid": 31331, "ts": 667115539808.797, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115539843.130, "dur": 2.424, + "args": { + "External id": 231138,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115539844.120, "dur": 1.249, + "args": { + "External id": 231139,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115539859.263, "dur": 5.728, + "args": { + "External id": 231140,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115539875.836, "dur": 3.016, + "args": { + "External id": 231141,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540025.951, "dur": 1.458, + "args": { + "External id": 231142,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115540031.649, "dur": 34.060, + "args": { + "External id": 231143,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540040.865, "dur": 0.887, + "args": { + "External id": 231144,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115540070.804, "dur": 31.613, + "args": { + "External id": 231145,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115540074.889, "dur": 27.320, + "args": { + "External id": 231146,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540079.126, "dur": 3.898, + "args": { + "External id": 231147,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115540084.359, "dur": 17.325, + "args": { + "External id": 231148,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115540106.995, "dur": 2.575, + "args": { + "External id": 231149,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540108.329, "dur": 1.107, + "args": { + "External id": 231150,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540115.808, "dur": 3.985, + "args": { + "External id": 231151,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540118.877, "dur": 0.823, + "args": { + "External id": 231152,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115540136.090, "dur": 14.970, + "args": { + "External id": 231153,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540164.626, "dur": 7.777, + "args": { + "External id": 231154,"Record function id": 0, "Ev Idx": 1265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540166.979, "dur": 4.736, + "args": { + "External id": 231155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115540168.332, "dur": 2.423, + "args": { + "External id": 231156,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115540169.166, "dur": 1.502, + "args": { + "External id": 231157,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540176.401, "dur": 7.506, + "args": { + "External id": 231158,"Record function id": 0, "Sequence number": 2757819, "Fwd thread id": 1, "Ev Idx": 1269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540177.911, "dur": 1.450, + "args": { + "External id": 231159,"Sequence number": 2757819, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1270 + } + }, + { + "ph": "f", "id": 137, "pid": 4183442, "tid": 31331, "ts": 667115540177.911, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115540187.822, "dur": 400.318, + "args": { + "External id": 231160,"Record function id": 0, "Sequence number": 2757818, "Fwd thread id": 1, "Ev Idx": 1271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115540189.605, "dur": 384.808, + "args": { + "External id": 231161,"Sequence number": 2757818, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1272 + } + }, + { + "ph": "f", "id": 138, "pid": 4183442, "tid": 31331, "ts": 667115540189.605, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540220.045, "dur": 8.012, + "args": { + "External id": 231162,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115540224.934, "dur": 2.841, + "args": { + "External id": 231163,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 1274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540230.872, "dur": 5.155, + "args": { + "External id": 231164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540232.346, "dur": 3.091, + "args": { + "External id": 231165,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540234.410, "dur": 0.888, + "args": { + "External id": 231166,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 31331, + "ts": 667115540239.638, "dur": 77.267, + "args": { + "External id": 231167,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 1278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540242.348, "dur": 4.957, + "args": { + "External id": 231168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 1279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540243.202, "dur": 3.625, + "args": { + "External id": 231169,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540244.789, "dur": 1.954, + "args": { + "External id": 231170,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 31331, + "ts": 667115540248.359, "dur": 68.085, + "args": { + "External id": 231171,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 1282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115540249.879, "dur": 65.643, + "args": { + "External id": 231172,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 1283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115540319.990, "dur": 2.412, + "args": { + "External id": 231173,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 1284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540321.014, "dur": 1.251, + "args": { + "External id": 231174,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 1285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115540353.853, "dur": 4.500, + "args": { + "External id": 231175,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115540359.420, "dur": 1.876, + "args": { + "External id": 231176,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115540362.263, "dur": 1.662, + "args": { + "External id": 231177,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540395.729, "dur": 2.446, + "args": { + "External id": 231178,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540396.873, "dur": 1.078, + "args": { + "External id": 231179,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183442, "tid": 31331, + "ts": 667115540418.678, "dur": 135.697, + "args": { + "External id": 231180,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 1291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115540423.521, "dur": 7.341, + "args": { + "External id": 231181,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540427.493, "dur": 2.408, + "args": { + "External id": 231182,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115540432.531, "dur": 6.169, + "args": { + "External id": 231183,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 1294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540435.900, "dur": 2.009, + "args": { + "External id": 231184,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 1295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 31331, + "ts": 667115540439.871, "dur": 2.631, + "args": { + "External id": 231185,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 1296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540441.598, "dur": 0.518, + "args": { + "External id": 231186,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115540443.465, "dur": 3.383, + "args": { + "External id": 231187,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540445.713, "dur": 0.546, + "args": { + "External id": 231188,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 1299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115540450.575, "dur": 3.153, + "args": { + "External id": 231189,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 1300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540452.759, "dur": 0.625, + "args": { + "External id": 231190,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 1301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540454.793, "dur": 5.542, + "args": { + "External id": 231191,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 1302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183442, "tid": 31331, + "ts": 667115540458.303, "dur": 1.835, + "args": { + "External id": 231192,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 1303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115540462.933, "dur": 2.607, + "args": { + "External id": 231193,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 1304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540464.873, "dur": 0.391, + "args": { + "External id": 231194,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 1305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540466.466, "dur": 4.024, + "args": { + "External id": 231195,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540467.479, "dur": 2.907, + "args": { + "External id": 231196,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115540471.824, "dur": 66.720, + "args": { + "External id": 231197,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 1308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540541.702, "dur": 3.796, + "args": { + "External id": 231198,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 1309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183442, "tid": 31331, + "ts": 667115540546.429, "dur": 3.801, + "args": { + "External id": 231199,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 1310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540548.759, "dur": 0.749, + "args": { + "External id": 231200,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 1311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540552.435, "dur": 0.795, + "args": { + "External id": 231201,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 1312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540598.742, "dur": 9.324, + "args": { + "External id": 231202,"Record function id": 0, "Ev Idx": 1313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540601.268, "dur": 6.157, + "args": { + "External id": 231203,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115540603.192, "dur": 3.280, + "args": { + "External id": 231204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115540604.325, "dur": 2.032, + "args": { + "External id": 231205,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540612.092, "dur": 7.793, + "args": { + "External id": 231206,"Record function id": 0, "Sequence number": 2757817, "Fwd thread id": 1, "Ev Idx": 1317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540613.305, "dur": 4.018, + "args": { + "External id": 231207,"Sequence number": 2757817, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1318 + } + }, + { + "ph": "f", "id": 139, "pid": 4183442, "tid": 31331, "ts": 667115540613.305, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540615.062, "dur": 2.075, + "args": { + "External id": 231208,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540616.210, "dur": 0.791, + "args": { + "External id": 231209,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540623.325, "dur": 155.449, + "args": { + "External id": 231210,"Record function id": 0, "Sequence number": 2757816, "Fwd thread id": 1, "Ev Idx": 1321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540624.299, "dur": 146.297, + "args": { + "External id": 231211,"Sequence number": 2757816, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1322 + } + }, + { + "ph": "f", "id": 140, "pid": 4183442, "tid": 31331, "ts": 667115540624.299, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540630.586, "dur": 4.216, + "args": { + "External id": 231212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540631.814, "dur": 2.421, + "args": { + "External id": 231213,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540633.567, "dur": 0.545, + "args": { + "External id": 231214,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115540635.970, "dur": 75.909, + "args": { + "External id": 231215,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540714.046, "dur": 6.715, + "args": { + "External id": 231216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540715.079, "dur": 4.648, + "args": { + "External id": 231217,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540718.348, "dur": 1.224, + "args": { + "External id": 231218,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540722.572, "dur": 4.583, + "args": { + "External id": 231219,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540723.996, "dur": 2.577, + "args": { + "External id": 231220,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540725.798, "dur": 0.700, + "args": { + "External id": 231221,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115540727.876, "dur": 41.633, + "args": { + "External id": 231222,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540785.207, "dur": 9.024, + "args": { + "External id": 231223,"Record function id": 0, "Sequence number": 2757815, "Fwd thread id": 1, "Ev Idx": 1334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540786.432, "dur": 6.391, + "args": { + "External id": 231224,"Sequence number": 2757815, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1335 + } + }, + { + "ph": "f", "id": 141, "pid": 4183442, "tid": 31331, "ts": 667115540786.432, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540788.338, "dur": 4.313, + "args": { + "External id": 231225,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540790.980, "dur": 1.573, + "args": { + "External id": 231226,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540798.170, "dur": 7.955, + "args": { + "External id": 231227,"Record function id": 0, "Sequence number": 2757814, "Fwd thread id": 1, "Ev Idx": 1338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540799.326, "dur": 4.670, + "args": { + "External id": 231228,"Sequence number": 2757814, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1339 + } + }, + { + "ph": "f", "id": 142, "pid": 4183442, "tid": 31331, "ts": 667115540799.326, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540800.010, "dur": 3.765, + "args": { + "External id": 231229,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540800.702, "dur": 2.549, + "args": { + "External id": 231230,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540802.561, "dur": 0.592, + "args": { + "External id": 231231,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540810.315, "dur": 6.974, + "args": { + "External id": 231232,"Record function id": 0, "Ev Idx": 1343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540812.469, "dur": 4.304, + "args": { + "External id": 231233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115540813.735, "dur": 2.700, + "args": { + "External id": 231234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115540815.183, "dur": 1.161, + "args": { + "External id": 231235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540820.761, "dur": 8.719, + "args": { + "External id": 231236,"Record function id": 0, "Sequence number": 2757813, "Fwd thread id": 1, "Ev Idx": 1347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540822.249, "dur": 4.908, + "args": { + "External id": 231237,"Sequence number": 2757813, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1348 + } + }, + { + "ph": "f", "id": 143, "pid": 4183442, "tid": 31331, "ts": 667115540822.249, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540825.477, "dur": 1.536, + "args": { + "External id": 231238,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540826.251, "dur": 0.624, + "args": { + "External id": 231239,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540832.621, "dur": 92.898, + "args": { + "External id": 231240,"Record function id": 0, "Sequence number": 2757812, "Fwd thread id": 1, "Ev Idx": 1351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540833.596, "dur": 82.597, + "args": { + "External id": 231241,"Sequence number": 2757812, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1352 + } + }, + { + "ph": "f", "id": 144, "pid": 4183442, "tid": 31331, "ts": 667115540833.596, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540836.213, "dur": 4.399, + "args": { + "External id": 231242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540836.621, "dur": 3.467, + "args": { + "External id": 231243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540839.204, "dur": 0.747, + "args": { + "External id": 231244,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115540841.188, "dur": 28.066, + "args": { + "External id": 231245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540870.369, "dur": 4.173, + "args": { + "External id": 231246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540870.968, "dur": 2.948, + "args": { + "External id": 231247,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540872.707, "dur": 1.070, + "args": { + "External id": 231248,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540875.884, "dur": 6.748, + "args": { + "External id": 231249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540877.477, "dur": 4.724, + "args": { + "External id": 231250,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540880.001, "dur": 2.113, + "args": { + "External id": 231251,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115540883.269, "dur": 32.319, + "args": { + "External id": 231252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540931.823, "dur": 31.353, + "args": { + "External id": 231253,"Record function id": 0, "Sequence number": 2757811, "Fwd thread id": 1, "Ev Idx": 1364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540932.897, "dur": 4.771, + "args": { + "External id": 231254,"Sequence number": 2757811, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1365 + } + }, + { + "ph": "f", "id": 145, "pid": 4183442, "tid": 31331, "ts": 667115540932.897, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115540934.898, "dur": 2.630, + "args": { + "External id": 231255,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115540936.124, "dur": 1.273, + "args": { + "External id": 231256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115540940.464, "dur": 19.851, + "args": { + "External id": 231257,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540966.850, "dur": 10.393, + "args": { + "External id": 231258,"Record function id": 0, "Sequence number": 2757810, "Fwd thread id": 1, "Ev Idx": 1369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115540968.109, "dur": 7.167, + "args": { + "External id": 231259,"Sequence number": 2757810, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1370 + } + }, + { + "ph": "f", "id": 146, "pid": 4183442, "tid": 31331, "ts": 667115540968.109, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115540969.154, "dur": 5.892, + "args": { + "External id": 231260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115540969.969, "dur": 4.578, + "args": { + "External id": 231261,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115540973.575, "dur": 0.866, + "args": { + "External id": 231262,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540981.108, "dur": 5.923, + "args": { + "External id": 231263,"Record function id": 0, "Ev Idx": 1374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115540982.895, "dur": 3.608, + "args": { + "External id": 231264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115540983.954, "dur": 2.106, + "args": { + "External id": 231265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115540984.516, "dur": 1.469, + "args": { + "External id": 231266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115540991.205, "dur": 403.541, + "args": { + "External id": 231267,"Record function id": 0, "Sequence number": 2757809, "Fwd thread id": 1, "Ev Idx": 1378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115540996.828, "dur": 362.642, + "args": { + "External id": 231268,"Sequence number": 2757809, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 1379 + } + }, + { + "ph": "f", "id": 147, "pid": 4183442, "tid": 31331, "ts": 667115540996.828, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 31331, + "ts": 667115541020.246, "dur": 34.957, + "args": { + "External id": 231269,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115541021.859, "dur": 33.071, + "args": { + "External id": 231270,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115541024.557, "dur": 6.762, + "args": { + "External id": 231271,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 1382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115541027.605, "dur": 3.207, + "args": { + "External id": 231272,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115541032.512, "dur": 21.851, + "args": { + "External id": 231273,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541068.463, "dur": 2.369, + "args": { + "External id": 231274,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541069.385, "dur": 1.291, + "args": { + "External id": 231275,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541074.931, "dur": 2.959, + "args": { + "External id": 231276,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541075.498, "dur": 2.296, + "args": { + "External id": 231277,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115541090.744, "dur": 2.504, + "args": { + "External id": 231278,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115541104.216, "dur": 3.457, + "args": { + "External id": 231279,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541257.777, "dur": 3.619, + "args": { + "External id": 231280,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115541265.542, "dur": 29.492, + "args": { + "External id": 231281,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541273.336, "dur": 0.612, + "args": { + "External id": 231282,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115541300.259, "dur": 27.720, + "args": { + "External id": 231283,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115541301.887, "dur": 25.887, + "args": { + "External id": 231284,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541306.742, "dur": 3.751, + "args": { + "External id": 231285,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115541313.217, "dur": 13.937, + "args": { + "External id": 231286,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115541331.798, "dur": 2.454, + "args": { + "External id": 231287,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541333.062, "dur": 1.044, + "args": { + "External id": 231288,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541341.408, "dur": 2.753, + "args": { + "External id": 231289,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541342.613, "dur": 1.415, + "args": { + "External id": 231290,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541346.823, "dur": 4.149, + "args": { + "External id": 231291,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541347.963, "dur": 2.915, + "args": { + "External id": 231292,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115541378.157, "dur": 15.063, + "args": { + "External id": 231293,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115541403.924, "dur": 8.371, + "args": { + "External id": 231294,"Record function id": 0, "Ev Idx": 1405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115541406.582, "dur": 5.005, + "args": { + "External id": 231295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115541407.970, "dur": 2.603, + "args": { + "External id": 231296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115541409.079, "dur": 1.396, + "args": { + "External id": 231297,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541416.109, "dur": 9.476, + "args": { + "External id": 231298,"Record function id": 0, "Sequence number": 2757808, "Fwd thread id": 1, "Ev Idx": 1409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541417.543, "dur": 4.807, + "args": { + "External id": 231299,"Sequence number": 2757808, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1410 + } + }, + { + "ph": "f", "id": 148, "pid": 4183442, "tid": 31331, "ts": 667115541417.543, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541419.723, "dur": 2.428, + "args": { + "External id": 231300,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541420.763, "dur": 1.237, + "args": { + "External id": 231301,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541430.582, "dur": 155.286, + "args": { + "External id": 231302,"Record function id": 0, "Sequence number": 2757807, "Fwd thread id": 1, "Ev Idx": 1413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541431.728, "dur": 145.214, + "args": { + "External id": 231303,"Sequence number": 2757807, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1414 + } + }, + { + "ph": "f", "id": 149, "pid": 4183442, "tid": 31331, "ts": 667115541431.728, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115541435.607, "dur": 4.540, + "args": { + "External id": 231304,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115541437.075, "dur": 2.539, + "args": { + "External id": 231305,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541438.571, "dur": 0.871, + "args": { + "External id": 231306,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115541441.197, "dur": 78.225, + "args": { + "External id": 231307,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115541521.849, "dur": 8.148, + "args": { + "External id": 231308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115541524.710, "dur": 4.423, + "args": { + "External id": 231309,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541527.004, "dur": 1.965, + "args": { + "External id": 231310,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115541531.749, "dur": 4.611, + "args": { + "External id": 231311,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115541533.183, "dur": 2.533, + "args": { + "External id": 231312,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541535.221, "dur": 0.396, + "args": { + "External id": 231313,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115541536.907, "dur": 39.326, + "args": { + "External id": 231314,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541592.425, "dur": 12.229, + "args": { + "External id": 231315,"Record function id": 0, "Sequence number": 2757806, "Fwd thread id": 1, "Ev Idx": 1426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541593.447, "dur": 8.216, + "args": { + "External id": 231316,"Sequence number": 2757806, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1427 + } + }, + { + "ph": "f", "id": 150, "pid": 4183442, "tid": 31331, "ts": 667115541593.447, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541597.044, "dur": 4.472, + "args": { + "External id": 231317,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541598.504, "dur": 2.867, + "args": { + "External id": 231318,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541608.153, "dur": 7.355, + "args": { + "External id": 231319,"Record function id": 0, "Sequence number": 2757805, "Fwd thread id": 1, "Ev Idx": 1430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541609.037, "dur": 4.537, + "args": { + "External id": 231320,"Sequence number": 2757805, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1431 + } + }, + { + "ph": "f", "id": 151, "pid": 4183442, "tid": 31331, "ts": 667115541609.037, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115541609.850, "dur": 3.531, + "args": { + "External id": 231321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115541610.401, "dur": 2.537, + "args": { + "External id": 231322,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541612.216, "dur": 0.570, + "args": { + "External id": 231323,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115541619.760, "dur": 8.232, + "args": { + "External id": 231324,"Record function id": 0, "Ev Idx": 1435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115541621.471, "dur": 5.990, + "args": { + "External id": 231325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115541622.855, "dur": 4.220, + "args": { + "External id": 231326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115541625.672, "dur": 1.272, + "args": { + "External id": 231327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541630.948, "dur": 6.616, + "args": { + "External id": 231328,"Record function id": 0, "Sequence number": 2757804, "Fwd thread id": 1, "Ev Idx": 1439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115541631.868, "dur": 3.558, + "args": { + "External id": 231329,"Sequence number": 2757804, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1440 + } + }, + { + "ph": "f", "id": 152, "pid": 4183442, "tid": 31331, "ts": 667115541631.868, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115541633.080, "dur": 2.202, + "args": { + "External id": 231330,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115541633.981, "dur": 1.154, + "args": { + "External id": 231331,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115541641.993, "dur": 320.364, + "args": { + "External id": 231332,"Record function id": 0, "Sequence number": 2757803, "Fwd thread id": 1, "Ev Idx": 1443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183442, "tid": 31331, + "ts": 667115541643.851, "dur": 297.041, + "args": { + "External id": 231333,"Sequence number": 2757803, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1444 + } + }, + { + "ph": "f", "id": 153, "pid": 4183442, "tid": 31331, "ts": 667115541643.851, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115541693.919, "dur": 9.226, + "args": { + "External id": 231334,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541696.860, "dur": 5.695, + "args": { + "External id": 231335,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115541705.338, "dur": 3.525, + "args": { + "External id": 231336,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541706.828, "dur": 1.819, + "args": { + "External id": 231337,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115541710.398, "dur": 3.974, + "args": { + "External id": 231338,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541712.542, "dur": 1.626, + "args": { + "External id": 231339,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115541738.075, "dur": 177.143, + "args": { + "External id": 231340,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115541816.088, "dur": 4.597, + "args": { + "External id": 231341,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115541822.528, "dur": 3.559, + "args": { + "External id": 231342,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115541927.682, "dur": 3.865, + "args": { + "External id": 231343,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115541934.764, "dur": 0.646, + "args": { + "External id": 231344,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 31331, + "ts": 667115541937.460, "dur": 0.658, + "args": { + "External id": 231345,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115541972.239, "dur": 223.617, + "args": { + "External id": 231346,"Record function id": 0, "Sequence number": 2757802, "Fwd thread id": 1, "Ev Idx": 1457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115541974.556, "dur": 214.237, + "args": { + "External id": 231347,"Sequence number": 2757802, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1458 + } + }, + { + "ph": "f", "id": 154, "pid": 4183442, "tid": 31331, "ts": 667115541974.556, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115541994.308, "dur": 48.036, + "args": { + "External id": 231348,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115541997.354, "dur": 2.692, + "args": { + "External id": 231349,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115542001.535, "dur": 40.204, + "args": { + "External id": 231350,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115542052.037, "dur": 4.168, + "args": { + "External id": 231351,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542053.895, "dur": 2.055, + "args": { + "External id": 231352,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115542203.051, "dur": 145.813, + "args": { + "External id": 231353,"Record function id": 0, "Sequence number": 2757801, "Fwd thread id": 1, "Ev Idx": 1464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115542205.252, "dur": 136.720, + "args": { + "External id": 231354,"Sequence number": 2757801, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1465 + } + }, + { + "ph": "f", "id": 155, "pid": 4183442, "tid": 31331, "ts": 667115542205.252, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 31331, + "ts": 667115542216.069, "dur": 31.590, + "args": { + "External id": 231355,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542218.301, "dur": 2.426, + "args": { + "External id": 231356,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115542221.524, "dur": 25.452, + "args": { + "External id": 231357,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 31331, + "ts": 667115542254.051, "dur": 4.162, + "args": { + "External id": 231358,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542255.731, "dur": 2.149, + "args": { + "External id": 231359,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542354.648, "dur": 16.567, + "args": { + "External id": 231360,"Record function id": 0, "Sequence number": 2757800, "Fwd thread id": 1, "Ev Idx": 1471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542356.028, "dur": 12.110, + "args": { + "External id": 231361,"Sequence number": 2757800, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1472 + } + }, + { + "ph": "f", "id": 156, "pid": 4183442, "tid": 31331, "ts": 667115542356.028, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542360.350, "dur": 7.524, + "args": { + "External id": 231362,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542362.101, "dur": 5.610, + "args": { + "External id": 231363,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542374.577, "dur": 7.201, + "args": { + "External id": 231364,"Record function id": 0, "Sequence number": 2757799, "Fwd thread id": 1, "Ev Idx": 1475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542375.367, "dur": 3.495, + "args": { + "External id": 231365,"Sequence number": 2757799, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1476 + } + }, + { + "ph": "f", "id": 157, "pid": 4183442, "tid": 31331, "ts": 667115542375.367, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542376.848, "dur": 1.880, + "args": { + "External id": 231366,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542377.768, "dur": 0.812, + "args": { + "External id": 231367,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542385.034, "dur": 6.652, + "args": { + "External id": 231368,"Record function id": 0, "Sequence number": 2757798, "Fwd thread id": 1, "Ev Idx": 1479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542385.790, "dur": 3.538, + "args": { + "External id": 231369,"Sequence number": 2757798, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1480 + } + }, + { + "ph": "f", "id": 158, "pid": 4183442, "tid": 31331, "ts": 667115542385.790, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542387.496, "dur": 1.692, + "args": { + "External id": 231370,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542388.319, "dur": 0.744, + "args": { + "External id": 231371,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542394.856, "dur": 8.343, + "args": { + "External id": 231372,"Record function id": 0, "Sequence number": 2757797, "Fwd thread id": 1, "Ev Idx": 1483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542395.949, "dur": 4.826, + "args": { + "External id": 231373,"Sequence number": 2757797, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1484 + } + }, + { + "ph": "f", "id": 159, "pid": 4183442, "tid": 31331, "ts": 667115542395.949, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542398.835, "dur": 1.806, + "args": { + "External id": 231374,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542399.522, "dur": 0.978, + "args": { + "External id": 231375,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542406.719, "dur": 186.544, + "args": { + "External id": 231376,"Record function id": 0, "Sequence number": 2757796, "Fwd thread id": 1, "Ev Idx": 1487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542407.876, "dur": 176.720, + "args": { + "External id": 231377,"Sequence number": 2757796, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1488 + } + }, + { + "ph": "f", "id": 160, "pid": 4183442, "tid": 31331, "ts": 667115542407.876, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542412.243, "dur": 7.655, + "args": { + "External id": 231378,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542414.052, "dur": 5.274, + "args": { + "External id": 231379,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542417.565, "dur": 1.490, + "args": { + "External id": 231380,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542421.328, "dur": 100.667, + "args": { + "External id": 231381,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542524.581, "dur": 6.068, + "args": { + "External id": 231382,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542525.545, "dur": 4.100, + "args": { + "External id": 231383,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542528.071, "dur": 1.367, + "args": { + "External id": 231384,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542532.567, "dur": 4.883, + "args": { + "External id": 231385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542534.031, "dur": 2.938, + "args": { + "External id": 231386,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542536.401, "dur": 0.490, + "args": { + "External id": 231387,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542538.262, "dur": 45.420, + "args": { + "External id": 231388,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542600.148, "dur": 8.152, + "args": { + "External id": 231389,"Record function id": 0, "Sequence number": 2757795, "Fwd thread id": 1, "Ev Idx": 1500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542601.268, "dur": 5.290, + "args": { + "External id": 231390,"Sequence number": 2757795, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1501 + } + }, + { + "ph": "f", "id": 161, "pid": 4183442, "tid": 31331, "ts": 667115542601.268, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542603.145, "dur": 3.236, + "args": { + "External id": 231391,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542604.631, "dur": 1.608, + "args": { + "External id": 231392,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542611.729, "dur": 9.733, + "args": { + "External id": 231393,"Record function id": 0, "Sequence number": 2757794, "Fwd thread id": 1, "Ev Idx": 1504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542612.789, "dur": 6.180, + "args": { + "External id": 231394,"Sequence number": 2757794, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1505 + } + }, + { + "ph": "f", "id": 162, "pid": 4183442, "tid": 31331, "ts": 667115542612.789, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542613.668, "dur": 5.070, + "args": { + "External id": 231395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542615.905, "dur": 2.260, + "args": { + "External id": 231396,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542617.430, "dur": 0.579, + "args": { + "External id": 231397,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115542627.314, "dur": 9.541, + "args": { + "External id": 231398,"Record function id": 0, "Ev Idx": 1509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115542629.320, "dur": 6.898, + "args": { + "External id": 231399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115542632.013, "dur": 3.737, + "args": { + "External id": 231400,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115542633.252, "dur": 2.368, + "args": { + "External id": 231401,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542640.398, "dur": 6.897, + "args": { + "External id": 231402,"Record function id": 0, "Sequence number": 2757793, "Fwd thread id": 1, "Ev Idx": 1513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542642.002, "dur": 3.145, + "args": { + "External id": 231403,"Sequence number": 2757793, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1514 + } + }, + { + "ph": "f", "id": 163, "pid": 4183442, "tid": 31331, "ts": 667115542642.002, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542643.193, "dur": 1.822, + "args": { + "External id": 231404,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542643.991, "dur": 0.889, + "args": { + "External id": 231405,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542652.104, "dur": 146.201, + "args": { + "External id": 231406,"Record function id": 0, "Sequence number": 2757792, "Fwd thread id": 1, "Ev Idx": 1517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542689.578, "dur": 100.823, + "args": { + "External id": 231407,"Sequence number": 2757792, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1518 + } + }, + { + "ph": "f", "id": 164, "pid": 4183442, "tid": 31331, "ts": 667115542689.578, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542693.611, "dur": 4.659, + "args": { + "External id": 231408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542694.364, "dur": 3.274, + "args": { + "External id": 231409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542696.712, "dur": 0.664, + "args": { + "External id": 231410,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542699.009, "dur": 43.465, + "args": { + "External id": 231411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542743.583, "dur": 6.020, + "args": { + "External id": 231412,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542744.409, "dur": 4.541, + "args": { + "External id": 231413,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542747.857, "dur": 0.974, + "args": { + "External id": 231414,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542750.764, "dur": 4.917, + "args": { + "External id": 231415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542752.037, "dur": 3.176, + "args": { + "External id": 231416,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542753.296, "dur": 1.840, + "args": { + "External id": 231417,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542756.335, "dur": 33.323, + "args": { + "External id": 231418,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542806.059, "dur": 45.772, + "args": { + "External id": 231419,"Record function id": 0, "Sequence number": 2757791, "Fwd thread id": 1, "Ev Idx": 1530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542807.480, "dur": 9.573, + "args": { + "External id": 231420,"Sequence number": 2757791, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1531 + } + }, + { + "ph": "f", "id": 165, "pid": 4183442, "tid": 31331, "ts": 667115542807.480, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542811.450, "dur": 5.460, + "args": { + "External id": 231421,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542815.458, "dur": 1.359, + "args": { + "External id": 231422,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 31331, + "ts": 667115542820.286, "dur": 28.833, + "args": { + "External id": 231423,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542855.592, "dur": 31.089, + "args": { + "External id": 231424,"Record function id": 0, "Sequence number": 2757790, "Fwd thread id": 1, "Ev Idx": 1535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542877.687, "dur": 6.785, + "args": { + "External id": 231425,"Sequence number": 2757790, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1536 + } + }, + { + "ph": "f", "id": 166, "pid": 4183442, "tid": 31331, "ts": 667115542877.687, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542878.488, "dur": 5.790, + "args": { + "External id": 231426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542879.354, "dur": 4.395, + "args": { + "External id": 231427,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542882.970, "dur": 0.631, + "args": { + "External id": 231428,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115542891.320, "dur": 5.992, + "args": { + "External id": 231429,"Record function id": 0, "Ev Idx": 1540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115542892.874, "dur": 3.889, + "args": { + "External id": 231430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115542893.899, "dur": 2.317, + "args": { + "External id": 231431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115542894.760, "dur": 1.364, + "args": { + "External id": 231432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542900.838, "dur": 6.477, + "args": { + "External id": 231433,"Record function id": 0, "Sequence number": 2757789, "Fwd thread id": 1, "Ev Idx": 1544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542902.375, "dur": 2.762, + "args": { + "External id": 231434,"Sequence number": 2757789, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1545 + } + }, + { + "ph": "f", "id": 167, "pid": 4183442, "tid": 31331, "ts": 667115542902.375, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115542903.420, "dur": 1.583, + "args": { + "External id": 231435,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115542904.073, "dur": 0.792, + "args": { + "External id": 231436,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542910.736, "dur": 97.632, + "args": { + "External id": 231437,"Record function id": 0, "Sequence number": 2757788, "Fwd thread id": 1, "Ev Idx": 1548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115542911.620, "dur": 87.722, + "args": { + "External id": 231438,"Sequence number": 2757788, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1549 + } + }, + { + "ph": "f", "id": 168, "pid": 4183442, "tid": 31331, "ts": 667115542911.620, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542916.863, "dur": 2.708, + "args": { + "External id": 231439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542917.316, "dur": 1.775, + "args": { + "External id": 231440,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542918.489, "dur": 0.479, + "args": { + "External id": 231441,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542920.133, "dur": 36.017, + "args": { + "External id": 231442,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542957.155, "dur": 5.329, + "args": { + "External id": 231443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542957.778, "dur": 4.158, + "args": { + "External id": 231444,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542961.284, "dur": 0.536, + "args": { + "External id": 231445,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115542964.066, "dur": 3.317, + "args": { + "External id": 231446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115542965.273, "dur": 1.685, + "args": { + "External id": 231447,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115542966.495, "dur": 0.374, + "args": { + "External id": 231448,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115542967.979, "dur": 30.473, + "args": { + "External id": 231449,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115543012.677, "dur": 24.602, + "args": { + "External id": 231450,"Record function id": 0, "Sequence number": 2757787, "Fwd thread id": 1, "Ev Idx": 1561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115543013.574, "dur": 3.894, + "args": { + "External id": 231451,"Sequence number": 2757787, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1562 + } + }, + { + "ph": "f", "id": 169, "pid": 4183442, "tid": 31331, "ts": 667115543013.574, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115543015.211, "dur": 2.095, + "args": { + "External id": 231452,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115543016.293, "dur": 0.915, + "args": { + "External id": 231453,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115543019.602, "dur": 15.085, + "args": { + "External id": 231454,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115543040.762, "dur": 8.662, + "args": { + "External id": 231455,"Record function id": 0, "Sequence number": 2757786, "Fwd thread id": 1, "Ev Idx": 1566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183442, "tid": 31331, + "ts": 667115543043.622, "dur": 4.117, + "args": { + "External id": 231456,"Sequence number": 2757786, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1567 + } + }, + { + "ph": "f", "id": 170, "pid": 4183442, "tid": 31331, "ts": 667115543043.622, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 31331, + "ts": 667115543044.373, "dur": 3.135, + "args": { + "External id": 231457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 31331, + "ts": 667115543044.858, "dur": 2.178, + "args": { + "External id": 231458,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543046.385, "dur": 0.562, + "args": { + "External id": 231459,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115543053.326, "dur": 4.852, + "args": { + "External id": 231460,"Record function id": 0, "Ev Idx": 1571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115543055.158, "dur": 2.429, + "args": { + "External id": 231461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115543055.951, "dur": 1.352, + "args": { + "External id": 231462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115543056.357, "dur": 0.835, + "args": { + "External id": 231463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115543062.153, "dur": 347.437, + "args": { + "External id": 231464,"Record function id": 0, "Sequence number": 2757785, "Fwd thread id": 1, "Ev Idx": 1575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115543063.560, "dur": 310.936, + "args": { + "External id": 231465,"Sequence number": 2757785, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1576 + } + }, + { + "ph": "f", "id": 171, "pid": 4183442, "tid": 31331, "ts": 667115543063.560, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115543095.904, "dur": 3.609, + "args": { + "External id": 231466,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115543098.304, "dur": 1.056, + "args": { + "External id": 231467,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115543114.283, "dur": 5.594, + "args": { + "External id": 231468,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115543129.808, "dur": 3.230, + "args": { + "External id": 231469,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115543274.867, "dur": 1.760, + "args": { + "External id": 231470,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 31331, + "ts": 667115543280.982, "dur": 35.032, + "args": { + "External id": 231471,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543290.846, "dur": 0.828, + "args": { + "External id": 231472,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115543321.598, "dur": 31.141, + "args": { + "External id": 231473,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115543325.236, "dur": 27.297, + "args": { + "External id": 231474,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543329.117, "dur": 3.742, + "args": { + "External id": 231475,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115543334.246, "dur": 17.693, + "args": { + "External id": 231476,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 31331, + "ts": 667115543357.045, "dur": 2.551, + "args": { + "External id": 231477,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115543358.513, "dur": 0.954, + "args": { + "External id": 231478,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 31331, + "ts": 667115543365.645, "dur": 2.525, + "args": { + "External id": 231479,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115543366.789, "dur": 1.273, + "args": { + "External id": 231480,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 31331, + "ts": 667115543388.326, "dur": 16.593, + "args": { + "External id": 231481,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115543418.327, "dur": 7.541, + "args": { + "External id": 231482,"Record function id": 0, "Ev Idx": 1593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115543420.378, "dur": 4.868, + "args": { + "External id": 231483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115543422.289, "dur": 2.137, + "args": { + "External id": 231484,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115543422.942, "dur": 1.380, + "args": { + "External id": 231485,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115543430.650, "dur": 2708.289, + "args": { + "External id": 231486,"Record function id": 0, "Ev Idx": 1597 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.19)", "pid": 4183442, "tid": 31331, + "ts": 667115543462.648, "dur": 998.222, + "args": { + "External id": 231487,"Record function id": 0, "Ev Idx": 1598 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.18", "pid": 4183442, "tid": 31331, + "ts": 667115543487.724, "dur": 965.326, + "args": { + "External id": 231488,"Record function id": 0, "Ev Idx": 1599 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115543525.092, "dur": 913.370, + "args": { + "External id": 231489,"Record function id": 0, "Ev Idx": 1600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115543615.669, "dur": 7.928, + "args": { + "External id": 231490,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115543641.014, "dur": 68.788, + "args": { + "External id": 231491,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543645.361, "dur": 1.466, + "args": { + "External id": 231492,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543648.963, "dur": 2.235, + "args": { + "External id": 231493,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543688.780, "dur": 0.658, + "args": { + "External id": 231494,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543691.367, "dur": 0.315, + "args": { + "External id": 231495,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543693.427, "dur": 0.310, + "args": { + "External id": 231496,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543696.115, "dur": 0.572, + "args": { + "External id": 231497,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543697.916, "dur": 0.347, + "args": { + "External id": 231498,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543699.376, "dur": 1.211, + "args": { + "External id": 231499,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543702.058, "dur": 0.637, + "args": { + "External id": 231500,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115543727.106, "dur": 38.665, + "args": { + "External id": 231501,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115543810.475, "dur": 115.898, + "args": { + "External id": 231502,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115543822.469, "dur": 5.612, + "args": { + "External id": 231503,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115543834.583, "dur": 12.510, + "args": { + "External id": 231504,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115543840.861, "dur": 5.846, + "args": { + "External id": 231505,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543844.786, "dur": 0.790, + "args": { + "External id": 231506,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115543854.496, "dur": 27.868, + "args": { + "External id": 231507,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543856.984, "dur": 0.540, + "args": { + "External id": 231508,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543859.163, "dur": 1.454, + "args": { + "External id": 231509,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543862.415, "dur": 0.288, + "args": { + "External id": 231510,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543863.907, "dur": 0.410, + "args": { + "External id": 231511,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543866.899, "dur": 0.317, + "args": { + "External id": 231512,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543868.608, "dur": 0.239, + "args": { + "External id": 231513,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543870.339, "dur": 2.034, + "args": { + "External id": 231514,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543875.046, "dur": 0.323, + "args": { + "External id": 231515,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115543876.685, "dur": 0.301, + "args": { + "External id": 231516,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115543893.789, "dur": 24.408, + "args": { + "External id": 231517,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115543986.665, "dur": 354.621, + "args": { + "External id": 231518,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115544019.067, "dur": 317.569, + "args": { + "External id": 231519,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1630, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115544030.525, "dur": 300.437, + "args": { + "External id": 231520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115544362.465, "dur": 2.413, + "args": { + "External id": 231521,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1632, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115544469.279, "dur": 1646.369, + "args": { + "External id": 231522,"Sequence number": 2757784, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1633 + } + }, + { + "ph": "f", "id": 172, "pid": 4183442, "tid": 31331, "ts": 667115544469.279, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115544618.360, "dur": 141.447, + "args": { + "External id": 231523,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115544807.067, "dur": 39.962, + "args": { + "External id": 231524,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115544867.374, "dur": 44.114, + "args": { + "External id": 231525,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115544920.885, "dur": 28.741, + "args": { + "External id": 231526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115544955.968, "dur": 33.267, + "args": { + "External id": 231527,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115544998.177, "dur": 22.409, + "args": { + "External id": 231528,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545028.586, "dur": 28.213, + "args": { + "External id": 231529,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115545081.528, "dur": 22.102, + "args": { + "External id": 231530,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115545124.658, "dur": 29.158, + "args": { + "External id": 231531,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115545175.422, "dur": 19.604, + "args": { + "External id": 231532,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115545209.549, "dur": 15.181, + "args": { + "External id": 231533,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545236.113, "dur": 36.913, + "args": { + "External id": 231534,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545276.041, "dur": 29.983, + "args": { + "External id": 231535,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115545335.502, "dur": 191.864, + "args": { + "External id": 231536,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115545411.597, "dur": 5.893, + "args": { + "External id": 231537,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115545419.342, "dur": 4.641, + "args": { + "External id": 231538,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115545565.323, "dur": 28.125, + "args": { + "External id": 231539,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115545605.768, "dur": 14.129, + "args": { + "External id": 231540,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545630.442, "dur": 84.225, + "args": { + "External id": 231541,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545723.694, "dur": 34.606, + "args": { + "External id": 231542,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545765.947, "dur": 28.105, + "args": { + "External id": 231543,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545801.022, "dur": 28.486, + "args": { + "External id": 231544,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545834.671, "dur": 26.278, + "args": { + "External id": 231545,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115545868.467, "dur": 28.643, + "args": { + "External id": 231546,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115545917.417, "dur": 23.509, + "args": { + "External id": 231547,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115545961.349, "dur": 25.137, + "args": { + "External id": 231548,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115546006.555, "dur": 17.798, + "args": { + "External id": 231549,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115546039.908, "dur": 14.387, + "args": { + "External id": 231550,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115546070.631, "dur": 16.084, + "args": { + "External id": 231551,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546160.403, "dur": 15.468, + "args": { + "External id": 231552,"Record function id": 0, "Ev Idx": 1663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546164.179, "dur": 10.924, + "args": { + "External id": 231553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546168.365, "dur": 5.589, + "args": { + "External id": 231554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546169.959, "dur": 3.888, + "args": { + "External id": 231555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546179.868, "dur": 4.703, + "args": { + "External id": 231556,"Record function id": 0, "Ev Idx": 1667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546181.641, "dur": 2.435, + "args": { + "External id": 231557,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546182.385, "dur": 1.240, + "args": { + "External id": 231558,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546182.892, "dur": 0.642, + "args": { + "External id": 231559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546187.851, "dur": 5.052, + "args": { + "External id": 231560,"Record function id": 0, "Ev Idx": 1671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546189.545, "dur": 2.877, + "args": { + "External id": 231561,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546190.274, "dur": 1.668, + "args": { + "External id": 231562,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546191.045, "dur": 0.819, + "args": { + "External id": 231563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546196.238, "dur": 5.502, + "args": { + "External id": 231564,"Record function id": 0, "Ev Idx": 1675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546197.430, "dur": 3.886, + "args": { + "External id": 231565,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546197.986, "dur": 2.905, + "args": { + "External id": 231566,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546198.321, "dur": 2.478, + "args": { + "External id": 231567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546204.978, "dur": 6.214, + "args": { + "External id": 231568,"Record function id": 0, "Ev Idx": 1679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546206.362, "dur": 4.398, + "args": { + "External id": 231569,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546207.048, "dur": 3.332, + "args": { + "External id": 231570,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546209.303, "dur": 0.932, + "args": { + "External id": 231571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546214.467, "dur": 3.660, + "args": { + "External id": 231572,"Record function id": 0, "Ev Idx": 1683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546215.614, "dur": 2.109, + "args": { + "External id": 231573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546216.235, "dur": 1.065, + "args": { + "External id": 231574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546216.682, "dur": 0.536, + "args": { + "External id": 231575,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546221.435, "dur": 3.803, + "args": { + "External id": 231576,"Record function id": 0, "Ev Idx": 1687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546222.813, "dur": 2.011, + "args": { + "External id": 231577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546223.291, "dur": 1.150, + "args": { + "External id": 231578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546223.708, "dur": 0.657, + "args": { + "External id": 231579,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546228.265, "dur": 3.845, + "args": { + "External id": 231580,"Record function id": 0, "Ev Idx": 1691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546229.586, "dur": 2.109, + "args": { + "External id": 231581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546230.196, "dur": 1.103, + "args": { + "External id": 231582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546230.499, "dur": 0.727, + "args": { + "External id": 231583,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546235.972, "dur": 5.560, + "args": { + "External id": 231584,"Record function id": 0, "Ev Idx": 1695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115546237.490, "dur": 3.588, + "args": { + "External id": 231585,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115546238.105, "dur": 2.527, + "args": { + "External id": 231586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115546239.931, "dur": 0.574, + "args": { + "External id": 231587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115546245.793, "dur": 59031.716, + "args": { + "External id": 231588,"Record function id": 0, "Sequence number": 2757783, "Fwd thread id": 1, "Ev Idx": 1699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115546247.024, "dur": 59022.446, + "args": { + "External id": 231589,"Sequence number": 2757783, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1700 + } + }, + { + "ph": "f", "id": 173, "pid": 4183442, "tid": 31331, "ts": 667115546247.024, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.19)", "pid": 4183442, "tid": 31331, + "ts": 667115546277.799, "dur": 40.672, + "args": { + "External id": 231590,"Record function id": 0, "Ev Idx": 1701 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.19)", "pid": 4183442, "tid": 31331, + "ts": 667115546325.891, "dur": 86.286, + "args": { + "External id": 231591,"Record function id": 0, "Ev Idx": 1702 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.19)", "pid": 4183442, "tid": 31331, + "ts": 667115546417.983, "dur": 58843.587, + "args": { + "External id": 231592,"Record function id": 0, "Ev Idx": 1703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115546471.782, "dur": 7.672, + "args": { + "External id": 231593,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115546489.132, "dur": 24.055, + "args": { + "External id": 231594,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115546533.377, "dur": 57947.556, + "args": { + "External id": 231595,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115546547.593, "dur": 57925.481, + "args": { + "External id": 231596,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115546578.450, "dur": 7.980, + "args": { + "External id": 231597,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115546593.262, "dur": 57842.523, + "args": { + "External id": 231598,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 1709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115546595.527, "dur": 57839.573, + "args": { + "External id": 231599,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 1710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115546599.430, "dur": 5.923, + "args": { + "External id": 231600,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115546606.902, "dur": 57824.352, + "args": { + "External id": 231601,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 1712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115604583.996, "dur": 10.078, + "args": { + "External id": 231602,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 1713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115604587.426, "dur": 6.042, + "args": { + "External id": 231603,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115604622.701, "dur": 324.063, + "args": { + "External id": 231604,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 1715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115604678.450, "dur": 263.548, + "args": { + "External id": 231605,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1716, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115604693.883, "dur": 243.124, + "args": { + "External id": 231606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 1717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115604967.379, "dur": 1.932, + "args": { + "External id": 231607,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1718, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605027.070, "dur": 5.916, + "args": { + "External id": 231608,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605090.445, "dur": 1.600, + "args": { + "External id": 231609,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605111.640, "dur": 1.122, + "args": { + "External id": 231610,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605129.093, "dur": 1.305, + "args": { + "External id": 231611,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605143.484, "dur": 0.929, + "args": { + "External id": 231612,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605155.618, "dur": 1.195, + "args": { + "External id": 231613,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605168.588, "dur": 1.013, + "args": { + "External id": 231614,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605185.032, "dur": 2.918, + "args": { + "External id": 231615,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605200.620, "dur": 1.038, + "args": { + "External id": 231616,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115605290.813, "dur": 2741.643, + "args": { + "External id": 231617,"Record function id": 0, "Ev Idx": 1728 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115605309.835, "dur": 1045.855, + "args": { + "External id": 231618,"Record function id": 0, "Ev Idx": 1729 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115605323.098, "dur": 371.860, + "args": { + "External id": 231619,"Record function id": 0, "Ev Idx": 1730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605408.355, "dur": 3.941, + "args": { + "External id": 231620,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605415.632, "dur": 1.462, + "args": { + "External id": 231621,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605418.899, "dur": 1.015, + "args": { + "External id": 231622,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605421.830, "dur": 2.585, + "args": { + "External id": 231623,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605426.357, "dur": 1.025, + "args": { + "External id": 231624,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605430.867, "dur": 0.884, + "args": { + "External id": 231625,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605433.526, "dur": 2.717, + "args": { + "External id": 231626,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605438.055, "dur": 0.855, + "args": { + "External id": 231627,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605440.731, "dur": 0.947, + "args": { + "External id": 231628,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115605444.645, "dur": 0.811, + "args": { + "External id": 231629,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115605464.037, "dur": 165.055, + "args": { + "External id": 231630,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115605480.280, "dur": 144.402, + "args": { + "External id": 231631,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115605516.692, "dur": 12.802, + "args": { + "External id": 231632,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115605532.640, "dur": 62.647, + "args": { + "External id": 231633,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 1744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115605534.918, "dur": 60.073, + "args": { + "External id": 231634,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 1745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605538.749, "dur": 7.935, + "args": { + "External id": 231635,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115605548.195, "dur": 46.087, + "args": { + "External id": 231636,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 1747 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.17", "pid": 4183442, "tid": 31331, + "ts": 667115605792.306, "dur": 556.472, + "args": { + "External id": 231637,"Record function id": 0, "Ev Idx": 1748 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115605809.379, "dur": 526.076, + "args": { + "External id": 231638,"Record function id": 0, "Ev Idx": 1749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115605870.269, "dur": 5.271, + "args": { + "External id": 231639,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115605890.919, "dur": 33.509, + "args": { + "External id": 231640,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605895.921, "dur": 2.920, + "args": { + "External id": 231641,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605901.134, "dur": 0.393, + "args": { + "External id": 231642,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605902.992, "dur": 0.516, + "args": { + "External id": 231643,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605905.825, "dur": 0.401, + "args": { + "External id": 231644,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605907.360, "dur": 0.534, + "args": { + "External id": 231645,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605909.569, "dur": 0.351, + "args": { + "External id": 231646,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605912.031, "dur": 2.036, + "args": { + "External id": 231647,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605915.636, "dur": 0.478, + "args": { + "External id": 231648,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115605917.367, "dur": 0.786, + "args": { + "External id": 231649,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115605937.849, "dur": 34.314, + "args": { + "External id": 231650,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115606003.756, "dur": 103.472, + "args": { + "External id": 231651,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115606013.431, "dur": 3.843, + "args": { + "External id": 231652,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115606022.720, "dur": 9.938, + "args": { + "External id": 231653,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115606026.769, "dur": 5.466, + "args": { + "External id": 231654,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606030.337, "dur": 0.622, + "args": { + "External id": 231655,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115606039.285, "dur": 27.557, + "args": { + "External id": 231656,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606041.333, "dur": 0.565, + "args": { + "External id": 231657,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606043.640, "dur": 1.180, + "args": { + "External id": 231658,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606046.360, "dur": 0.646, + "args": { + "External id": 231659,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606048.420, "dur": 2.188, + "args": { + "External id": 231660,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606053.301, "dur": 0.373, + "args": { + "External id": 231661,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606055.077, "dur": 0.262, + "args": { + "External id": 231662,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606056.581, "dur": 0.215, + "args": { + "External id": 231663,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606059.190, "dur": 0.345, + "args": { + "External id": 231664,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115606061.082, "dur": 0.380, + "args": { + "External id": 231665,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115606078.431, "dur": 20.713, + "args": { + "External id": 231666,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115606149.989, "dur": 118.558, + "args": { + "External id": 231667,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115606177.450, "dur": 87.701, + "args": { + "External id": 231668,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1779, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115606187.954, "dur": 73.397, + "args": { + "External id": 231669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115606285.823, "dur": 1.750, + "args": { + "External id": 231670,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1781, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115606362.085, "dur": 1644.833, + "args": { + "External id": 231671,"Sequence number": 2757782, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1782 + } + }, + { + "ph": "f", "id": 174, "pid": 4183442, "tid": 31331, "ts": 667115606362.085, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115606471.131, "dur": 123.598, + "args": { + "External id": 231672,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115606644.598, "dur": 78.581, + "args": { + "External id": 231673,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115606743.520, "dur": 47.313, + "args": { + "External id": 231674,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115606801.241, "dur": 28.741, + "args": { + "External id": 231675,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115606839.143, "dur": 34.137, + "args": { + "External id": 231676,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115606880.086, "dur": 21.820, + "args": { + "External id": 231677,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115606908.573, "dur": 28.289, + "args": { + "External id": 231678,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115606961.790, "dur": 22.960, + "args": { + "External id": 231679,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115607003.952, "dur": 25.662, + "args": { + "External id": 231680,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115607051.600, "dur": 19.589, + "args": { + "External id": 231681,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115607084.453, "dur": 14.802, + "args": { + "External id": 231682,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607107.004, "dur": 36.958, + "args": { + "External id": 231683,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607147.444, "dur": 33.135, + "args": { + "External id": 231684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115607209.637, "dur": 167.789, + "args": { + "External id": 231685,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115607288.865, "dur": 6.442, + "args": { + "External id": 231686,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115607297.228, "dur": 1.938, + "args": { + "External id": 231687,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115607421.550, "dur": 24.334, + "args": { + "External id": 231688,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115607460.351, "dur": 12.130, + "args": { + "External id": 231689,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607480.174, "dur": 61.540, + "args": { + "External id": 231690,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607549.711, "dur": 32.042, + "args": { + "External id": 231691,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607591.461, "dur": 28.147, + "args": { + "External id": 231692,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607624.107, "dur": 61.817, + "args": { + "External id": 231693,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607696.674, "dur": 32.011, + "args": { + "External id": 231694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115607747.225, "dur": 38.904, + "args": { + "External id": 231695,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115607811.918, "dur": 22.993, + "args": { + "External id": 231696,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115607857.077, "dur": 23.968, + "args": { + "External id": 231697,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115607897.537, "dur": 17.691, + "args": { + "External id": 231698,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115607931.477, "dur": 13.335, + "args": { + "External id": 231699,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115607959.752, "dur": 18.705, + "args": { + "External id": 231700,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608053.211, "dur": 14.916, + "args": { + "External id": 231701,"Record function id": 0, "Ev Idx": 1812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608056.643, "dur": 10.493, + "args": { + "External id": 231702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608060.707, "dur": 5.344, + "args": { + "External id": 231703,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608062.079, "dur": 3.871, + "args": { + "External id": 231704,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608072.028, "dur": 6.094, + "args": { + "External id": 231705,"Record function id": 0, "Ev Idx": 1816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608073.780, "dur": 3.806, + "args": { + "External id": 231706,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608075.206, "dur": 1.744, + "args": { + "External id": 231707,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608075.872, "dur": 0.989, + "args": { + "External id": 231708,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608081.448, "dur": 10.496, + "args": { + "External id": 231709,"Record function id": 0, "Ev Idx": 1820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608083.084, "dur": 8.416, + "args": { + "External id": 231710,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608084.051, "dur": 7.016, + "args": { + "External id": 231711,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608084.616, "dur": 6.317, + "args": { + "External id": 231712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608095.107, "dur": 5.026, + "args": { + "External id": 231713,"Record function id": 0, "Ev Idx": 1824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608096.839, "dur": 2.881, + "args": { + "External id": 231714,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608097.801, "dur": 1.467, + "args": { + "External id": 231715,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608098.316, "dur": 0.841, + "args": { + "External id": 231716,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608103.272, "dur": 3.761, + "args": { + "External id": 231717,"Record function id": 0, "Ev Idx": 1828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608104.798, "dur": 1.815, + "args": { + "External id": 231718,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608105.285, "dur": 0.925, + "args": { + "External id": 231719,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608105.536, "dur": 0.604, + "args": { + "External id": 231720,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608110.153, "dur": 4.275, + "args": { + "External id": 231721,"Record function id": 0, "Ev Idx": 1832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608111.272, "dur": 2.702, + "args": { + "External id": 231722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608112.174, "dur": 1.361, + "args": { + "External id": 231723,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608112.843, "dur": 0.626, + "args": { + "External id": 231724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608117.734, "dur": 4.008, + "args": { + "External id": 231725,"Record function id": 0, "Ev Idx": 1836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608118.996, "dur": 2.340, + "args": { + "External id": 231726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608119.686, "dur": 1.099, + "args": { + "External id": 231727,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608119.968, "dur": 0.747, + "args": { + "External id": 231728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608124.916, "dur": 3.333, + "args": { + "External id": 231729,"Record function id": 0, "Ev Idx": 1840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608125.901, "dur": 1.929, + "args": { + "External id": 231730,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608126.349, "dur": 1.027, + "args": { + "External id": 231731,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608126.603, "dur": 0.707, + "args": { + "External id": 231732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608131.334, "dur": 5.445, + "args": { + "External id": 231733,"Record function id": 0, "Ev Idx": 1844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115608132.551, "dur": 3.827, + "args": { + "External id": 231734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115608133.288, "dur": 2.557, + "args": { + "External id": 231735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115608135.060, "dur": 0.717, + "args": { + "External id": 231736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115608140.712, "dur": 15695.823, + "args": { + "External id": 231737,"Record function id": 0, "Sequence number": 2757781, "Fwd thread id": 1, "Ev Idx": 1848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115608141.849, "dur": 15686.352, + "args": { + "External id": 231738,"Sequence number": 2757781, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1849 + } + }, + { + "ph": "f", "id": 175, "pid": 4183442, "tid": 31331, "ts": 667115608141.849, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115608175.353, "dur": 38.736, + "args": { + "External id": 231739,"Record function id": 0, "Ev Idx": 1850 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115608221.525, "dur": 66.473, + "args": { + "External id": 231740,"Record function id": 0, "Ev Idx": 1851 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.18)", "pid": 4183442, "tid": 31331, + "ts": 667115608293.789, "dur": 15526.555, + "args": { + "External id": 231741,"Record function id": 0, "Ev Idx": 1852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115608377.779, "dur": 10.231, + "args": { + "External id": 231742,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115608397.065, "dur": 6.127, + "args": { + "External id": 231743,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115608420.967, "dur": 14622.000, + "args": { + "External id": 231744,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115608434.218, "dur": 14600.154, + "args": { + "External id": 231745,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115608462.692, "dur": 13.563, + "args": { + "External id": 231746,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115608481.695, "dur": 14519.189, + "args": { + "External id": 231747,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 1858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115608484.052, "dur": 14516.154, + "args": { + "External id": 231748,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 1859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115608489.168, "dur": 26.465, + "args": { + "External id": 231749,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115608518.210, "dur": 14478.648, + "args": { + "External id": 231750,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 1861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115623130.108, "dur": 9.467, + "args": { + "External id": 231751,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 1862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115623133.292, "dur": 5.901, + "args": { + "External id": 231752,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115623169.782, "dur": 298.048, + "args": { + "External id": 231753,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 1864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115623198.736, "dur": 265.059, + "args": { + "External id": 231754,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1865, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115623211.407, "dur": 247.706, + "args": { + "External id": 231755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 1866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115623486.531, "dur": 1.846, + "args": { + "External id": 231756,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1867, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623559.010, "dur": 6.135, + "args": { + "External id": 231757,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623612.282, "dur": 1.323, + "args": { + "External id": 231758,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623630.001, "dur": 3.113, + "args": { + "External id": 231759,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623646.488, "dur": 0.950, + "args": { + "External id": 231760,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623697.553, "dur": 1.246, + "args": { + "External id": 231761,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623711.826, "dur": 0.907, + "args": { + "External id": 231762,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623725.053, "dur": 3.084, + "args": { + "External id": 231763,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623741.745, "dur": 3.176, + "args": { + "External id": 231764,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115623756.600, "dur": 1.087, + "args": { + "External id": 231765,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115623852.281, "dur": 2625.198, + "args": { + "External id": 231766,"Record function id": 0, "Ev Idx": 1877 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115623872.846, "dur": 1012.189, + "args": { + "External id": 231767,"Record function id": 0, "Ev Idx": 1878 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115623888.682, "dur": 301.094, + "args": { + "External id": 231768,"Record function id": 0, "Ev Idx": 1879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623970.100, "dur": 4.167, + "args": { + "External id": 231769,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623977.501, "dur": 1.510, + "args": { + "External id": 231770,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623980.841, "dur": 2.686, + "args": { + "External id": 231771,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623985.175, "dur": 0.928, + "args": { + "External id": 231772,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623989.349, "dur": 1.072, + "args": { + "External id": 231773,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623991.787, "dur": 1.048, + "args": { + "External id": 231774,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623994.624, "dur": 1.929, + "args": { + "External id": 231775,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115623997.910, "dur": 1.126, + "args": { + "External id": 231776,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115624002.141, "dur": 1.009, + "args": { + "External id": 231777,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115624004.418, "dur": 0.927, + "args": { + "External id": 231778,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115624022.215, "dur": 140.444, + "args": { + "External id": 231779,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115624037.544, "dur": 120.858, + "args": { + "External id": 231780,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115624053.260, "dur": 13.102, + "args": { + "External id": 231781,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115624068.933, "dur": 63.553, + "args": { + "External id": 231782,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 1893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115624071.638, "dur": 60.526, + "args": { + "External id": 231783,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 1894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624075.974, "dur": 5.411, + "args": { + "External id": 231784,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115624084.553, "dur": 47.105, + "args": { + "External id": 231785,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 1896 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.16", "pid": 4183442, "tid": 31331, + "ts": 667115624271.882, "dur": 606.361, + "args": { + "External id": 231786,"Record function id": 0, "Ev Idx": 1897 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115624287.812, "dur": 578.652, + "args": { + "External id": 231787,"Record function id": 0, "Ev Idx": 1898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115624343.977, "dur": 4.357, + "args": { + "External id": 231788,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115624362.761, "dur": 30.977, + "args": { + "External id": 231789,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624366.974, "dur": 1.126, + "args": { + "External id": 231790,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624369.796, "dur": 1.768, + "args": { + "External id": 231791,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624372.841, "dur": 0.879, + "args": { + "External id": 231792,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624374.851, "dur": 0.560, + "args": { + "External id": 231793,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624378.309, "dur": 0.500, + "args": { + "External id": 231794,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624379.852, "dur": 2.408, + "args": { + "External id": 231795,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624383.195, "dur": 0.510, + "args": { + "External id": 231796,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624385.706, "dur": 0.381, + "args": { + "External id": 231797,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624387.326, "dur": 0.585, + "args": { + "External id": 231798,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115624403.027, "dur": 29.058, + "args": { + "External id": 231799,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115624461.611, "dur": 132.406, + "args": { + "External id": 231800,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115624470.459, "dur": 3.646, + "args": { + "External id": 231801,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115624478.886, "dur": 9.267, + "args": { + "External id": 231802,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115624482.548, "dur": 5.193, + "args": { + "External id": 231803,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624485.634, "dur": 0.874, + "args": { + "External id": 231804,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115624515.464, "dur": 36.982, + "args": { + "External id": 231805,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624517.728, "dur": 0.813, + "args": { + "External id": 231806,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624521.983, "dur": 0.464, + "args": { + "External id": 231807,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624531.916, "dur": 2.381, + "args": { + "External id": 231808,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624535.504, "dur": 1.391, + "args": { + "External id": 231809,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624537.919, "dur": 0.463, + "args": { + "External id": 231810,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624539.602, "dur": 0.520, + "args": { + "External id": 231811,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624543.028, "dur": 0.420, + "args": { + "External id": 231812,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624544.220, "dur": 0.389, + "args": { + "External id": 231813,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115624545.550, "dur": 0.309, + "args": { + "External id": 231814,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115624563.630, "dur": 22.004, + "args": { + "External id": 231815,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115624637.998, "dur": 158.711, + "args": { + "External id": 231816,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115624700.319, "dur": 92.385, + "args": { + "External id": 231817,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1928, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115624714.249, "dur": 74.623, + "args": { + "External id": 231818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115624813.725, "dur": 1.935, + "args": { + "External id": 231819,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1930, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115624892.217, "dur": 1563.727, + "args": { + "External id": 231820,"Sequence number": 2757780, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1931 + } + }, + { + "ph": "f", "id": 176, "pid": 4183442, "tid": 31331, "ts": 667115624892.217, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625003.944, "dur": 95.658, + "args": { + "External id": 231821,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115625137.819, "dur": 36.104, + "args": { + "External id": 231822,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115625190.575, "dur": 39.921, + "args": { + "External id": 231823,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625241.284, "dur": 25.240, + "args": { + "External id": 231824,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625273.617, "dur": 35.715, + "args": { + "External id": 231825,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625315.645, "dur": 20.374, + "args": { + "External id": 231826,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625350.696, "dur": 29.939, + "args": { + "External id": 231827,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115625408.125, "dur": 23.051, + "args": { + "External id": 231828,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115625448.743, "dur": 27.164, + "args": { + "External id": 231829,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115625516.978, "dur": 20.908, + "args": { + "External id": 231830,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115625554.413, "dur": 14.183, + "args": { + "External id": 231831,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625578.129, "dur": 39.798, + "args": { + "External id": 231832,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625621.473, "dur": 68.275, + "args": { + "External id": 231833,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115625722.787, "dur": 168.549, + "args": { + "External id": 231834,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115625800.147, "dur": 7.022, + "args": { + "External id": 231835,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115625809.207, "dur": 2.304, + "args": { + "External id": 231836,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115625928.190, "dur": 24.558, + "args": { + "External id": 231837,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115625965.193, "dur": 14.306, + "args": { + "External id": 231838,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115625990.474, "dur": 48.799, + "args": { + "External id": 231839,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115626044.702, "dur": 30.703, + "args": { + "External id": 231840,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115626082.960, "dur": 28.126, + "args": { + "External id": 231841,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115626115.344, "dur": 27.878, + "args": { + "External id": 231842,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115626148.947, "dur": 27.736, + "args": { + "External id": 231843,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115626186.388, "dur": 43.836, + "args": { + "External id": 231844,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115626259.358, "dur": 26.922, + "args": { + "External id": 231845,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115626303.236, "dur": 27.611, + "args": { + "External id": 231846,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115626346.449, "dur": 18.305, + "args": { + "External id": 231847,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115626380.557, "dur": 15.308, + "args": { + "External id": 231848,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115626410.034, "dur": 19.210, + "args": { + "External id": 231849,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626524.345, "dur": 16.685, + "args": { + "External id": 231850,"Record function id": 0, "Ev Idx": 1961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626527.894, "dur": 12.087, + "args": { + "External id": 231851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626532.302, "dur": 6.351, + "args": { + "External id": 231852,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626534.073, "dur": 4.331, + "args": { + "External id": 231853,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626544.983, "dur": 10.651, + "args": { + "External id": 231854,"Record function id": 0, "Ev Idx": 1965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626546.345, "dur": 8.838, + "args": { + "External id": 231855,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626550.605, "dur": 4.015, + "args": { + "External id": 231856,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626551.247, "dur": 3.263, + "args": { + "External id": 231857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626558.921, "dur": 5.246, + "args": { + "External id": 231858,"Record function id": 0, "Ev Idx": 1969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626560.596, "dur": 3.111, + "args": { + "External id": 231859,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626561.492, "dur": 1.809, + "args": { + "External id": 231860,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626562.016, "dur": 1.197, + "args": { + "External id": 231861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626567.562, "dur": 4.267, + "args": { + "External id": 231862,"Record function id": 0, "Ev Idx": 1973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626568.759, "dur": 2.615, + "args": { + "External id": 231863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626569.415, "dur": 1.410, + "args": { + "External id": 231864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626569.879, "dur": 0.857, + "args": { + "External id": 231865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626574.906, "dur": 3.705, + "args": { + "External id": 231866,"Record function id": 0, "Ev Idx": 1977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626575.952, "dur": 2.254, + "args": { + "External id": 231867,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626576.736, "dur": 1.053, + "args": { + "External id": 231868,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626577.011, "dur": 0.711, + "args": { + "External id": 231869,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626581.840, "dur": 4.423, + "args": { + "External id": 231870,"Record function id": 0, "Ev Idx": 1981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626582.858, "dur": 2.876, + "args": { + "External id": 231871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626583.708, "dur": 1.450, + "args": { + "External id": 231872,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626584.338, "dur": 0.719, + "args": { + "External id": 231873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626589.596, "dur": 3.853, + "args": { + "External id": 231874,"Record function id": 0, "Ev Idx": 1985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626590.683, "dur": 2.360, + "args": { + "External id": 231875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626591.513, "dur": 1.145, + "args": { + "External id": 231876,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626591.798, "dur": 0.733, + "args": { + "External id": 231877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626596.524, "dur": 5.637, + "args": { + "External id": 231878,"Record function id": 0, "Ev Idx": 1989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626597.531, "dur": 4.220, + "args": { + "External id": 231879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626598.220, "dur": 3.025, + "args": { + "External id": 231880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626600.614, "dur": 0.566, + "args": { + "External id": 231881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626605.260, "dur": 8.379, + "args": { + "External id": 231882,"Record function id": 0, "Ev Idx": 1993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115626609.454, "dur": 3.784, + "args": { + "External id": 231883,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115626610.284, "dur": 2.403, + "args": { + "External id": 231884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115626610.563, "dur": 2.053, + "args": { + "External id": 231885,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115626617.453, "dur": 15358.408, + "args": { + "External id": 231886,"Record function id": 0, "Sequence number": 2757779, "Fwd thread id": 1, "Ev Idx": 1997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115626618.916, "dur": 15348.131, + "args": { + "External id": 231887,"Sequence number": 2757779, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1998 + } + }, + { + "ph": "f", "id": 177, "pid": 4183442, "tid": 31331, "ts": 667115626618.916, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115626650.555, "dur": 81.713, + "args": { + "External id": 231888,"Record function id": 0, "Ev Idx": 1999 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115626740.639, "dur": 64.515, + "args": { + "External id": 231889,"Record function id": 0, "Ev Idx": 2000 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.17)", "pid": 4183442, "tid": 31331, + "ts": 667115626812.789, "dur": 15147.058, + "args": { + "External id": 231890,"Record function id": 0, "Ev Idx": 2001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115626898.138, "dur": 7.412, + "args": { + "External id": 231891,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115626918.622, "dur": 5.058, + "args": { + "External id": 231892,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115626937.621, "dur": 14325.598, + "args": { + "External id": 231893,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115626950.527, "dur": 14304.100, + "args": { + "External id": 231894,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115626978.090, "dur": 13.815, + "args": { + "External id": 231895,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115626996.065, "dur": 14224.329, + "args": { + "External id": 231896,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115626998.652, "dur": 14220.816, + "args": { + "External id": 231897,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115627002.460, "dur": 4.941, + "args": { + "External id": 231898,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115627010.658, "dur": 14205.243, + "args": { + "External id": 231899,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115641348.819, "dur": 9.508, + "args": { + "External id": 231900,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115641351.799, "dur": 6.116, + "args": { + "External id": 231901,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115641384.605, "dur": 259.431, + "args": { + "External id": 231902,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115641412.884, "dur": 226.732, + "args": { + "External id": 231903,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2014, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115641423.438, "dur": 211.134, + "args": { + "External id": 231904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115641693.948, "dur": 3.058, + "args": { + "External id": 231905,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2016, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641753.563, "dur": 6.017, + "args": { + "External id": 231906,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641803.800, "dur": 3.139, + "args": { + "External id": 231907,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641822.833, "dur": 1.222, + "args": { + "External id": 231908,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641836.118, "dur": 0.999, + "args": { + "External id": 231909,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641848.172, "dur": 1.189, + "args": { + "External id": 231910,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641860.008, "dur": 2.516, + "args": { + "External id": 231911,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641875.255, "dur": 0.934, + "args": { + "External id": 231912,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641887.279, "dur": 3.053, + "args": { + "External id": 231913,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115641899.835, "dur": 1.162, + "args": { + "External id": 231914,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115641990.478, "dur": 2636.713, + "args": { + "External id": 231915,"Record function id": 0, "Ev Idx": 2026 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115642009.116, "dur": 1025.535, + "args": { + "External id": 231916,"Record function id": 0, "Ev Idx": 2027 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115642023.361, "dur": 300.516, + "args": { + "External id": 231917,"Record function id": 0, "Ev Idx": 2028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642105.060, "dur": 5.764, + "args": { + "External id": 231918,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642113.926, "dur": 0.940, + "args": { + "External id": 231919,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642116.349, "dur": 1.189, + "args": { + "External id": 231920,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642120.604, "dur": 1.074, + "args": { + "External id": 231921,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642122.979, "dur": 0.866, + "args": { + "External id": 231922,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642125.244, "dur": 0.922, + "args": { + "External id": 231923,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642127.561, "dur": 1.804, + "args": { + "External id": 231924,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642132.135, "dur": 0.793, + "args": { + "External id": 231925,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642134.450, "dur": 2.560, + "args": { + "External id": 231926,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115642138.370, "dur": 0.928, + "args": { + "External id": 231927,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115642155.802, "dur": 141.253, + "args": { + "External id": 231928,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115642170.582, "dur": 122.882, + "args": { + "External id": 231929,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115642186.139, "dur": 13.497, + "args": { + "External id": 231930,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115642204.247, "dur": 62.463, + "args": { + "External id": 231931,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115642206.658, "dur": 59.679, + "args": { + "External id": 231932,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642211.602, "dur": 5.783, + "args": { + "External id": 231933,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115642219.118, "dur": 46.591, + "args": { + "External id": 231934,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2045 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.15", "pid": 4183442, "tid": 31331, + "ts": 667115642408.185, "dur": 618.737, + "args": { + "External id": 231935,"Record function id": 0, "Ev Idx": 2046 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115642424.132, "dur": 590.827, + "args": { + "External id": 231936,"Record function id": 0, "Ev Idx": 2047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115642522.463, "dur": 6.833, + "args": { + "External id": 231937,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115642545.586, "dur": 26.046, + "args": { + "External id": 231938,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642549.810, "dur": 1.555, + "args": { + "External id": 231939,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642553.762, "dur": 0.482, + "args": { + "External id": 231940,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642555.390, "dur": 0.411, + "args": { + "External id": 231941,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642556.462, "dur": 2.868, + "args": { + "External id": 231942,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642560.114, "dur": 0.319, + "args": { + "External id": 231943,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642561.111, "dur": 0.502, + "args": { + "External id": 231944,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642563.664, "dur": 0.495, + "args": { + "External id": 231945,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642564.841, "dur": 0.328, + "args": { + "External id": 231946,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642565.966, "dur": 0.350, + "args": { + "External id": 231947,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115642581.898, "dur": 32.462, + "args": { + "External id": 231948,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115642646.249, "dur": 141.231, + "args": { + "External id": 231949,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115642694.201, "dur": 4.842, + "args": { + "External id": 231950,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115642704.686, "dur": 10.139, + "args": { + "External id": 231951,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115642708.819, "dur": 5.598, + "args": { + "External id": 231952,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642711.600, "dur": 1.479, + "args": { + "External id": 231953,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115642722.181, "dur": 21.842, + "args": { + "External id": 231954,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642724.302, "dur": 2.068, + "args": { + "External id": 231955,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642727.629, "dur": 0.503, + "args": { + "External id": 231956,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642728.838, "dur": 0.310, + "args": { + "External id": 231957,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642731.205, "dur": 0.342, + "args": { + "External id": 231958,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642732.174, "dur": 0.436, + "args": { + "External id": 231959,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642733.301, "dur": 1.216, + "args": { + "External id": 231960,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642735.231, "dur": 0.463, + "args": { + "External id": 231961,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642736.291, "dur": 0.251, + "args": { + "External id": 231962,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115642738.400, "dur": 1.668, + "args": { + "External id": 231963,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115642756.245, "dur": 23.104, + "args": { + "External id": 231964,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115642835.388, "dur": 112.585, + "args": { + "External id": 231965,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115642862.889, "dur": 81.833, + "args": { + "External id": 231966,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2077, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115642871.828, "dur": 68.767, + "args": { + "External id": 231967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115642963.852, "dur": 1.690, + "args": { + "External id": 231968,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2079, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115643041.665, "dur": 1561.158, + "args": { + "External id": 231969,"Sequence number": 2757778, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2080 + } + }, + { + "ph": "f", "id": 178, "pid": 4183442, "tid": 31331, "ts": 667115643041.665, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643152.429, "dur": 96.978, + "args": { + "External id": 231970,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115643286.639, "dur": 37.625, + "args": { + "External id": 231971,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115643342.596, "dur": 39.918, + "args": { + "External id": 231972,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643392.447, "dur": 27.100, + "args": { + "External id": 231973,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643426.266, "dur": 33.826, + "args": { + "External id": 231974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643466.492, "dur": 44.767, + "args": { + "External id": 231975,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643523.501, "dur": 36.677, + "args": { + "External id": 231976,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115643586.712, "dur": 22.574, + "args": { + "External id": 231977,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115643626.224, "dur": 60.597, + "args": { + "External id": 231978,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115643713.049, "dur": 20.370, + "args": { + "External id": 231979,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115643747.195, "dur": 14.499, + "args": { + "External id": 231980,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643771.428, "dur": 41.300, + "args": { + "External id": 231981,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115643816.566, "dur": 32.079, + "args": { + "External id": 231982,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115643878.172, "dur": 170.130, + "args": { + "External id": 231983,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115643958.161, "dur": 6.148, + "args": { + "External id": 231984,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115643966.604, "dur": 2.363, + "args": { + "External id": 231985,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115644082.169, "dur": 23.617, + "args": { + "External id": 231986,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115644116.252, "dur": 12.490, + "args": { + "External id": 231987,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644137.095, "dur": 40.079, + "args": { + "External id": 231988,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644187.273, "dur": 30.592, + "args": { + "External id": 231989,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644223.957, "dur": 29.401, + "args": { + "External id": 231990,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644257.589, "dur": 27.486, + "args": { + "External id": 231991,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644290.434, "dur": 25.924, + "args": { + "External id": 231992,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115644324.871, "dur": 27.592, + "args": { + "External id": 231993,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115644382.201, "dur": 31.268, + "args": { + "External id": 231994,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115644431.686, "dur": 21.849, + "args": { + "External id": 231995,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115644472.011, "dur": 15.386, + "args": { + "External id": 231996,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115644523.583, "dur": 21.098, + "args": { + "External id": 231997,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115644556.802, "dur": 14.662, + "args": { + "External id": 231998,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644648.214, "dur": 53.964, + "args": { + "External id": 231999,"Record function id": 0, "Ev Idx": 2110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644686.589, "dur": 14.230, + "args": { + "External id": 232000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644691.547, "dur": 8.091, + "args": { + "External id": 232001,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644692.971, "dur": 6.371, + "args": { + "External id": 232002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644708.534, "dur": 5.549, + "args": { + "External id": 232003,"Record function id": 0, "Ev Idx": 2114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644710.382, "dur": 3.245, + "args": { + "External id": 232004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644711.700, "dur": 1.491, + "args": { + "External id": 232005,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644712.263, "dur": 0.830, + "args": { + "External id": 232006,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644717.825, "dur": 4.680, + "args": { + "External id": 232007,"Record function id": 0, "Ev Idx": 2118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644719.351, "dur": 2.736, + "args": { + "External id": 232008,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644720.275, "dur": 1.398, + "args": { + "External id": 232009,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644720.719, "dur": 0.866, + "args": { + "External id": 232010,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644725.739, "dur": 3.596, + "args": { + "External id": 232011,"Record function id": 0, "Ev Idx": 2122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644726.819, "dur": 2.075, + "args": { + "External id": 232012,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644727.321, "dur": 1.161, + "args": { + "External id": 232013,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644727.698, "dur": 0.711, + "args": { + "External id": 232014,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644732.711, "dur": 5.194, + "args": { + "External id": 232015,"Record function id": 0, "Ev Idx": 2126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644733.825, "dur": 3.619, + "args": { + "External id": 232016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644734.504, "dur": 2.491, + "args": { + "External id": 232017,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644736.279, "dur": 0.586, + "args": { + "External id": 232018,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644741.026, "dur": 3.861, + "args": { + "External id": 232019,"Record function id": 0, "Ev Idx": 2130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644742.302, "dur": 2.169, + "args": { + "External id": 232020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644742.804, "dur": 1.074, + "args": { + "External id": 232021,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644743.121, "dur": 0.674, + "args": { + "External id": 232022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644748.243, "dur": 3.633, + "args": { + "External id": 232023,"Record function id": 0, "Ev Idx": 2134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644749.386, "dur": 2.007, + "args": { + "External id": 232024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644750.053, "dur": 0.936, + "args": { + "External id": 232025,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644750.302, "dur": 0.620, + "args": { + "External id": 232026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644758.314, "dur": 5.793, + "args": { + "External id": 232027,"Record function id": 0, "Ev Idx": 2138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644759.641, "dur": 4.067, + "args": { + "External id": 232028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644760.298, "dur": 2.871, + "args": { + "External id": 232029,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644760.634, "dur": 2.464, + "args": { + "External id": 232030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644767.131, "dur": 5.312, + "args": { + "External id": 232031,"Record function id": 0, "Ev Idx": 2142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115644768.477, "dur": 3.524, + "args": { + "External id": 232032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115644768.930, "dur": 2.709, + "args": { + "External id": 232033,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115644770.710, "dur": 0.839, + "args": { + "External id": 232034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115644776.246, "dur": 16495.432, + "args": { + "External id": 232035,"Record function id": 0, "Sequence number": 2757777, "Fwd thread id": 1, "Ev Idx": 2146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115644777.853, "dur": 16485.979, + "args": { + "External id": 232036,"Sequence number": 2757777, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2147 + } + }, + { + "ph": "f", "id": 179, "pid": 4183442, "tid": 31331, "ts": 667115644777.853, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115644809.856, "dur": 39.980, + "args": { + "External id": 232037,"Record function id": 0, "Ev Idx": 2148 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115644857.099, "dur": 66.945, + "args": { + "External id": 232038,"Record function id": 0, "Ev Idx": 2149 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.16)", "pid": 4183442, "tid": 31331, + "ts": 667115644933.092, "dur": 16323.536, + "args": { + "External id": 232039,"Record function id": 0, "Ev Idx": 2150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115645017.966, "dur": 7.095, + "args": { + "External id": 232040,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115645034.263, "dur": 4.853, + "args": { + "External id": 232041,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115645054.003, "dur": 15479.799, + "args": { + "External id": 232042,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115645068.459, "dur": 15457.269, + "args": { + "External id": 232043,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115645101.232, "dur": 13.676, + "args": { + "External id": 232044,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115645118.892, "dur": 15360.063, + "args": { + "External id": 232045,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115645121.328, "dur": 15356.903, + "args": { + "External id": 232046,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115645125.355, "dur": 4.499, + "args": { + "External id": 232047,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115645131.540, "dur": 15343.432, + "args": { + "External id": 232048,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115660619.222, "dur": 8.977, + "args": { + "External id": 232049,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115660621.917, "dur": 5.932, + "args": { + "External id": 232050,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115660683.633, "dur": 295.255, + "args": { + "External id": 232051,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115660712.543, "dur": 261.834, + "args": { + "External id": 232052,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2163, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115660724.385, "dur": 245.410, + "args": { + "External id": 232053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115660998.115, "dur": 2.172, + "args": { + "External id": 232054,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2165, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661054.775, "dur": 6.302, + "args": { + "External id": 232055,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661106.209, "dur": 1.173, + "args": { + "External id": 232056,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661122.637, "dur": 1.174, + "args": { + "External id": 232057,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661134.912, "dur": 1.154, + "args": { + "External id": 232058,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661147.364, "dur": 0.797, + "args": { + "External id": 232059,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661160.332, "dur": 0.811, + "args": { + "External id": 232060,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661171.200, "dur": 0.716, + "args": { + "External id": 232061,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661184.679, "dur": 1.815, + "args": { + "External id": 232062,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661196.057, "dur": 0.857, + "args": { + "External id": 232063,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115661284.762, "dur": 2656.424, + "args": { + "External id": 232064,"Record function id": 0, "Ev Idx": 2175 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115661303.473, "dur": 986.365, + "args": { + "External id": 232065,"Record function id": 0, "Ev Idx": 2176 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115661317.185, "dur": 314.335, + "args": { + "External id": 232066,"Record function id": 0, "Ev Idx": 2177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661394.987, "dur": 3.918, + "args": { + "External id": 232067,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661401.879, "dur": 1.060, + "args": { + "External id": 232068,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661404.824, "dur": 1.164, + "args": { + "External id": 232069,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661407.552, "dur": 0.798, + "args": { + "External id": 232070,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661410.047, "dur": 1.042, + "args": { + "External id": 232071,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661413.817, "dur": 1.263, + "args": { + "External id": 232072,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661416.675, "dur": 1.784, + "args": { + "External id": 232073,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661419.944, "dur": 2.739, + "args": { + "External id": 232074,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661424.492, "dur": 0.743, + "args": { + "External id": 232075,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115661427.467, "dur": 0.943, + "args": { + "External id": 232076,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115661445.402, "dur": 157.191, + "args": { + "External id": 232077,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115661461.435, "dur": 136.677, + "args": { + "External id": 232078,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115661474.395, "dur": 14.183, + "args": { + "External id": 232079,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115661510.030, "dur": 62.090, + "args": { + "External id": 232080,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115661513.283, "dur": 58.493, + "args": { + "External id": 232081,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661518.428, "dur": 5.530, + "args": { + "External id": 232082,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115661525.781, "dur": 45.179, + "args": { + "External id": 232083,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2194 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.14", "pid": 4183442, "tid": 31331, + "ts": 667115661756.953, "dur": 525.763, + "args": { + "External id": 232084,"Record function id": 0, "Ev Idx": 2195 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115661774.778, "dur": 496.703, + "args": { + "External id": 232085,"Record function id": 0, "Ev Idx": 2196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115661834.039, "dur": 5.265, + "args": { + "External id": 232086,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115661853.371, "dur": 30.733, + "args": { + "External id": 232087,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661858.200, "dur": 1.421, + "args": { + "External id": 232088,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661861.695, "dur": 0.585, + "args": { + "External id": 232089,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661864.643, "dur": 2.247, + "args": { + "External id": 232090,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661868.220, "dur": 0.379, + "args": { + "External id": 232091,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661869.792, "dur": 1.060, + "args": { + "External id": 232092,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661872.470, "dur": 0.330, + "args": { + "External id": 232093,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661874.233, "dur": 0.342, + "args": { + "External id": 232094,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661876.543, "dur": 0.383, + "args": { + "External id": 232095,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661878.680, "dur": 0.482, + "args": { + "External id": 232096,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115661896.650, "dur": 33.669, + "args": { + "External id": 232097,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115661961.369, "dur": 99.510, + "args": { + "External id": 232098,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115661971.462, "dur": 2.956, + "args": { + "External id": 232099,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115661979.495, "dur": 11.800, + "args": { + "External id": 232100,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115661983.350, "dur": 7.520, + "args": { + "External id": 232101,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115661987.104, "dur": 2.592, + "args": { + "External id": 232102,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115661998.424, "dur": 23.445, + "args": { + "External id": 232103,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662000.406, "dur": 0.528, + "args": { + "External id": 232104,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662003.109, "dur": 0.399, + "args": { + "External id": 232105,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662004.927, "dur": 0.421, + "args": { + "External id": 232106,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662006.762, "dur": 0.380, + "args": { + "External id": 232107,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662008.707, "dur": 0.362, + "args": { + "External id": 232108,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662010.573, "dur": 0.460, + "args": { + "External id": 232109,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662012.272, "dur": 0.422, + "args": { + "External id": 232110,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662013.725, "dur": 2.195, + "args": { + "External id": 232111,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115662017.173, "dur": 0.342, + "args": { + "External id": 232112,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115662031.775, "dur": 21.254, + "args": { + "External id": 232113,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115662102.582, "dur": 108.937, + "args": { + "External id": 232114,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115662125.942, "dur": 82.301, + "args": { + "External id": 232115,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2226, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115662135.125, "dur": 68.967, + "args": { + "External id": 232116,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115662224.304, "dur": 1.868, + "args": { + "External id": 232117,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2228, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115662297.115, "dur": 1619.836, + "args": { + "External id": 232118,"Sequence number": 2757776, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2229 + } + }, + { + "ph": "f", "id": 180, "pid": 4183442, "tid": 31331, "ts": 667115662297.115, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115662406.166, "dur": 118.152, + "args": { + "External id": 232119,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115662566.073, "dur": 38.444, + "args": { + "External id": 232120,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115662623.594, "dur": 83.340, + "args": { + "External id": 232121,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115662722.110, "dur": 29.433, + "args": { + "External id": 232122,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115662757.316, "dur": 34.505, + "args": { + "External id": 232123,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115662797.915, "dur": 19.729, + "args": { + "External id": 232124,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115662826.282, "dur": 28.283, + "args": { + "External id": 232125,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115662879.060, "dur": 22.084, + "args": { + "External id": 232126,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115662918.490, "dur": 23.994, + "args": { + "External id": 232127,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115662960.883, "dur": 16.739, + "args": { + "External id": 232128,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115662990.418, "dur": 13.737, + "args": { + "External id": 232129,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663014.119, "dur": 37.508, + "args": { + "External id": 232130,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663054.996, "dur": 30.248, + "args": { + "External id": 232131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115663112.616, "dur": 175.687, + "args": { + "External id": 232132,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115663190.435, "dur": 5.051, + "args": { + "External id": 232133,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115663197.206, "dur": 2.830, + "args": { + "External id": 232134,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115663319.190, "dur": 27.696, + "args": { + "External id": 232135,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115663357.924, "dur": 14.218, + "args": { + "External id": 232136,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663381.403, "dur": 41.243, + "args": { + "External id": 232137,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663427.968, "dur": 31.712, + "args": { + "External id": 232138,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663472.758, "dur": 49.759, + "args": { + "External id": 232139,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663529.706, "dur": 31.305, + "args": { + "External id": 232140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663568.558, "dur": 29.995, + "args": { + "External id": 232141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115663605.766, "dur": 28.734, + "args": { + "External id": 232142,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115663699.472, "dur": 27.865, + "args": { + "External id": 232143,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115663750.002, "dur": 37.687, + "args": { + "External id": 232144,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115663808.410, "dur": 16.420, + "args": { + "External id": 232145,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115663843.584, "dur": 13.876, + "args": { + "External id": 232146,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115663868.801, "dur": 18.081, + "args": { + "External id": 232147,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663962.458, "dur": 14.668, + "args": { + "External id": 232148,"Record function id": 0, "Ev Idx": 2259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663965.657, "dur": 10.693, + "args": { + "External id": 232149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115663969.913, "dur": 5.522, + "args": { + "External id": 232150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115663971.596, "dur": 3.754, + "args": { + "External id": 232151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663980.994, "dur": 5.018, + "args": { + "External id": 232152,"Record function id": 0, "Ev Idx": 2263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663982.895, "dur": 2.662, + "args": { + "External id": 232153,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115663983.742, "dur": 1.327, + "args": { + "External id": 232154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115663984.275, "dur": 0.721, + "args": { + "External id": 232155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663992.409, "dur": 4.531, + "args": { + "External id": 232156,"Record function id": 0, "Ev Idx": 2267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115663993.857, "dur": 2.625, + "args": { + "External id": 232157,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115663994.588, "dur": 1.495, + "args": { + "External id": 232158,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115663995.233, "dur": 0.754, + "args": { + "External id": 232159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664000.343, "dur": 3.673, + "args": { + "External id": 232160,"Record function id": 0, "Ev Idx": 2271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664001.721, "dur": 1.880, + "args": { + "External id": 232161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664002.249, "dur": 0.962, + "args": { + "External id": 232162,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664002.601, "dur": 0.545, + "args": { + "External id": 232163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664007.095, "dur": 3.497, + "args": { + "External id": 232164,"Record function id": 0, "Ev Idx": 2275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664008.191, "dur": 2.009, + "args": { + "External id": 232165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664008.683, "dur": 1.131, + "args": { + "External id": 232166,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664009.165, "dur": 0.556, + "args": { + "External id": 232167,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664013.914, "dur": 3.760, + "args": { + "External id": 232168,"Record function id": 0, "Ev Idx": 2279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664015.128, "dur": 2.103, + "args": { + "External id": 232169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664015.694, "dur": 1.129, + "args": { + "External id": 232170,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664016.054, "dur": 0.700, + "args": { + "External id": 232171,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664020.930, "dur": 5.971, + "args": { + "External id": 232172,"Record function id": 0, "Ev Idx": 2283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664022.379, "dur": 4.120, + "args": { + "External id": 232173,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664022.874, "dur": 3.240, + "args": { + "External id": 232174,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664023.553, "dur": 2.493, + "args": { + "External id": 232175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664030.175, "dur": 3.482, + "args": { + "External id": 232176,"Record function id": 0, "Ev Idx": 2287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664031.420, "dur": 1.826, + "args": { + "External id": 232177,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664031.891, "dur": 0.927, + "args": { + "External id": 232178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664032.163, "dur": 0.587, + "args": { + "External id": 232179,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664036.782, "dur": 3.439, + "args": { + "External id": 232180,"Record function id": 0, "Ev Idx": 2291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115664037.903, "dur": 1.917, + "args": { + "External id": 232181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115664038.415, "dur": 0.968, + "args": { + "External id": 232182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115664038.701, "dur": 0.615, + "args": { + "External id": 232183,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115664045.159, "dur": 14837.455, + "args": { + "External id": 232184,"Record function id": 0, "Sequence number": 2757775, "Fwd thread id": 1, "Ev Idx": 2295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115664049.866, "dur": 14824.365, + "args": { + "External id": 232185,"Sequence number": 2757775, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2296 + } + }, + { + "ph": "f", "id": 181, "pid": 4183442, "tid": 31331, "ts": 667115664049.866, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115664080.061, "dur": 39.450, + "args": { + "External id": 232186,"Record function id": 0, "Ev Idx": 2297 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115664127.464, "dur": 63.197, + "args": { + "External id": 232187,"Record function id": 0, "Ev Idx": 2298 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.15)", "pid": 4183442, "tid": 31331, + "ts": 667115664197.176, "dur": 14669.762, + "args": { + "External id": 232188,"Record function id": 0, "Ev Idx": 2299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115664286.427, "dur": 6.868, + "args": { + "External id": 232189,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115664303.086, "dur": 4.311, + "args": { + "External id": 232190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115664320.369, "dur": 13836.564, + "args": { + "External id": 232191,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115664337.448, "dur": 13811.579, + "args": { + "External id": 232192,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115664362.069, "dur": 13.955, + "args": { + "External id": 232193,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115664380.184, "dur": 13736.152, + "args": { + "External id": 232194,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115664384.078, "dur": 13731.469, + "args": { + "External id": 232195,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115664390.941, "dur": 4.171, + "args": { + "External id": 232196,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115664396.681, "dur": 13715.086, + "args": { + "External id": 232197,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115678243.317, "dur": 9.358, + "args": { + "External id": 232198,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115678246.080, "dur": 6.302, + "args": { + "External id": 232199,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115678280.082, "dur": 267.440, + "args": { + "External id": 232200,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115678307.308, "dur": 235.519, + "args": { + "External id": 232201,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2312, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115678319.186, "dur": 218.341, + "args": { + "External id": 232202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115678567.561, "dur": 2.191, + "args": { + "External id": 232203,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2314, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678623.462, "dur": 7.383, + "args": { + "External id": 232204,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678707.511, "dur": 2.147, + "args": { + "External id": 232205,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678725.766, "dur": 1.396, + "args": { + "External id": 232206,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678739.841, "dur": 1.023, + "args": { + "External id": 232207,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678751.881, "dur": 2.179, + "args": { + "External id": 232208,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678765.780, "dur": 0.832, + "args": { + "External id": 232209,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678777.165, "dur": 0.869, + "args": { + "External id": 232210,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678788.692, "dur": 2.038, + "args": { + "External id": 232211,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115678801.353, "dur": 2.655, + "args": { + "External id": 232212,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115678897.093, "dur": 2588.205, + "args": { + "External id": 232213,"Record function id": 0, "Ev Idx": 2324 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115678916.751, "dur": 999.375, + "args": { + "External id": 232214,"Record function id": 0, "Ev Idx": 2325 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115678931.879, "dur": 294.386, + "args": { + "External id": 232215,"Record function id": 0, "Ev Idx": 2326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679010.203, "dur": 3.878, + "args": { + "External id": 232216,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679017.589, "dur": 1.204, + "args": { + "External id": 232217,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679020.846, "dur": 1.188, + "args": { + "External id": 232218,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679024.175, "dur": 1.191, + "args": { + "External id": 232219,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679027.122, "dur": 0.984, + "args": { + "External id": 232220,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679029.853, "dur": 1.227, + "args": { + "External id": 232221,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679033.255, "dur": 3.342, + "args": { + "External id": 232222,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679038.406, "dur": 0.847, + "args": { + "External id": 232223,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679040.888, "dur": 0.667, + "args": { + "External id": 232224,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115679043.084, "dur": 0.869, + "args": { + "External id": 232225,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115679062.262, "dur": 136.505, + "args": { + "External id": 232226,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115679077.605, "dur": 117.074, + "args": { + "External id": 232227,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115679093.547, "dur": 12.396, + "args": { + "External id": 232228,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115679108.181, "dur": 61.776, + "args": { + "External id": 232229,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115679110.958, "dur": 58.728, + "args": { + "External id": 232230,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679114.631, "dur": 6.624, + "args": { + "External id": 232231,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115679122.835, "dur": 46.250, + "args": { + "External id": 232232,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2343 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.13", "pid": 4183442, "tid": 31331, + "ts": 667115679310.050, "dur": 598.144, + "args": { + "External id": 232233,"Record function id": 0, "Ev Idx": 2344 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115679327.273, "dur": 568.493, + "args": { + "External id": 232234,"Record function id": 0, "Ev Idx": 2345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115679382.453, "dur": 4.203, + "args": { + "External id": 232235,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115679400.971, "dur": 29.946, + "args": { + "External id": 232236,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679406.142, "dur": 1.919, + "args": { + "External id": 232237,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679410.028, "dur": 2.232, + "args": { + "External id": 232238,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679413.782, "dur": 0.524, + "args": { + "External id": 232239,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679416.471, "dur": 0.539, + "args": { + "External id": 232240,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679418.215, "dur": 0.411, + "args": { + "External id": 232241,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679419.852, "dur": 0.398, + "args": { + "External id": 232242,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679422.278, "dur": 0.266, + "args": { + "External id": 232243,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679423.669, "dur": 0.633, + "args": { + "External id": 232244,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679425.741, "dur": 0.976, + "args": { + "External id": 232245,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115679443.386, "dur": 30.874, + "args": { + "External id": 232246,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115679523.966, "dur": 106.956, + "args": { + "External id": 232247,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115679534.450, "dur": 6.383, + "args": { + "External id": 232248,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115679546.288, "dur": 9.523, + "args": { + "External id": 232249,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115679550.121, "dur": 5.316, + "args": { + "External id": 232250,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679553.574, "dur": 0.499, + "args": { + "External id": 232251,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115679563.539, "dur": 25.251, + "args": { + "External id": 232252,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679565.844, "dur": 0.511, + "args": { + "External id": 232253,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679567.932, "dur": 0.924, + "args": { + "External id": 232254,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679570.280, "dur": 0.603, + "args": { + "External id": 232255,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679572.283, "dur": 0.632, + "args": { + "External id": 232256,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679574.921, "dur": 0.528, + "args": { + "External id": 232257,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679576.996, "dur": 0.243, + "args": { + "External id": 232258,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679578.648, "dur": 2.160, + "args": { + "External id": 232259,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679582.443, "dur": 0.502, + "args": { + "External id": 232260,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115679584.336, "dur": 0.554, + "args": { + "External id": 232261,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115679601.007, "dur": 22.353, + "args": { + "External id": 232262,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115679715.296, "dur": 114.765, + "args": { + "External id": 232263,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115679739.747, "dur": 86.765, + "args": { + "External id": 232264,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2375, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115679749.544, "dur": 73.088, + "args": { + "External id": 232265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115679842.922, "dur": 1.650, + "args": { + "External id": 232266,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2377, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115679923.878, "dur": 1536.990, + "args": { + "External id": 232267,"Sequence number": 2757774, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2378 + } + }, + { + "ph": "f", "id": 182, "pid": 4183442, "tid": 31331, "ts": 667115679923.878, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680034.354, "dur": 96.622, + "args": { + "External id": 232268,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115680168.557, "dur": 36.618, + "args": { + "External id": 232269,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115680223.092, "dur": 39.077, + "args": { + "External id": 232270,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680272.032, "dur": 25.787, + "args": { + "External id": 232271,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680304.024, "dur": 32.619, + "args": { + "External id": 232272,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680345.399, "dur": 22.417, + "args": { + "External id": 232273,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680374.863, "dur": 28.714, + "args": { + "External id": 232274,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115680425.591, "dur": 23.451, + "args": { + "External id": 232275,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115680472.617, "dur": 46.756, + "args": { + "External id": 232276,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115680541.609, "dur": 21.771, + "args": { + "External id": 232277,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115680575.864, "dur": 15.917, + "args": { + "External id": 232278,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680602.563, "dur": 40.705, + "args": { + "External id": 232279,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115680646.567, "dur": 69.752, + "args": { + "External id": 232280,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115680749.900, "dur": 170.608, + "args": { + "External id": 232281,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115680824.883, "dur": 6.209, + "args": { + "External id": 232282,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115680832.908, "dur": 3.964, + "args": { + "External id": 232283,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115680953.028, "dur": 30.605, + "args": { + "External id": 232284,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115680994.212, "dur": 14.862, + "args": { + "External id": 232285,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681017.141, "dur": 49.178, + "args": { + "External id": 232286,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681072.203, "dur": 34.208, + "args": { + "External id": 232287,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681113.021, "dur": 27.440, + "args": { + "External id": 232288,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681148.955, "dur": 27.517, + "args": { + "External id": 232289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681181.666, "dur": 27.320, + "args": { + "External id": 232290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115681215.830, "dur": 27.377, + "args": { + "External id": 232291,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115681260.482, "dur": 22.367, + "args": { + "External id": 232292,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115681299.149, "dur": 38.088, + "args": { + "External id": 232293,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115681358.626, "dur": 16.962, + "args": { + "External id": 232294,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115681388.604, "dur": 12.980, + "args": { + "External id": 232295,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115681416.083, "dur": 17.782, + "args": { + "External id": 232296,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681526.593, "dur": 16.548, + "args": { + "External id": 232297,"Record function id": 0, "Ev Idx": 2408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681530.484, "dur": 11.578, + "args": { + "External id": 232298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681534.860, "dur": 5.928, + "args": { + "External id": 232299,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681536.191, "dur": 4.358, + "args": { + "External id": 232300,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681547.205, "dur": 5.035, + "args": { + "External id": 232301,"Record function id": 0, "Ev Idx": 2412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681548.806, "dur": 3.004, + "args": { + "External id": 232302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681549.895, "dur": 1.338, + "args": { + "External id": 232303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681550.397, "dur": 0.740, + "args": { + "External id": 232304,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681555.660, "dur": 4.223, + "args": { + "External id": 232305,"Record function id": 0, "Ev Idx": 2416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681557.187, "dur": 2.276, + "args": { + "External id": 232306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681557.819, "dur": 1.237, + "args": { + "External id": 232307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681558.227, "dur": 0.740, + "args": { + "External id": 232308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681563.322, "dur": 4.982, + "args": { + "External id": 232309,"Record function id": 0, "Ev Idx": 2420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681564.343, "dur": 3.525, + "args": { + "External id": 232310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681564.897, "dur": 2.586, + "args": { + "External id": 232311,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681565.386, "dur": 2.001, + "args": { + "External id": 232312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681571.622, "dur": 4.169, + "args": { + "External id": 232313,"Record function id": 0, "Ev Idx": 2424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681572.763, "dur": 2.603, + "args": { + "External id": 232314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681573.458, "dur": 1.242, + "args": { + "External id": 232315,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681573.867, "dur": 0.761, + "args": { + "External id": 232316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681578.904, "dur": 4.289, + "args": { + "External id": 232317,"Record function id": 0, "Ev Idx": 2428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681580.122, "dur": 2.656, + "args": { + "External id": 232318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681580.904, "dur": 1.346, + "args": { + "External id": 232319,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681581.361, "dur": 0.793, + "args": { + "External id": 232320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681586.395, "dur": 3.546, + "args": { + "External id": 232321,"Record function id": 0, "Ev Idx": 2432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681587.487, "dur": 2.060, + "args": { + "External id": 232322,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681588.139, "dur": 0.983, + "args": { + "External id": 232323,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681588.453, "dur": 0.603, + "args": { + "External id": 232324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681592.955, "dur": 4.086, + "args": { + "External id": 232325,"Record function id": 0, "Ev Idx": 2436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681594.030, "dur": 2.611, + "args": { + "External id": 232326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681594.904, "dur": 1.335, + "args": { + "External id": 232327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681595.481, "dur": 0.659, + "args": { + "External id": 232328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681600.239, "dur": 4.208, + "args": { + "External id": 232329,"Record function id": 0, "Ev Idx": 2440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115681601.336, "dur": 2.674, + "args": { + "External id": 232330,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115681601.984, "dur": 1.643, + "args": { + "External id": 232331,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115681602.942, "dur": 0.586, + "args": { + "External id": 232332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115681608.578, "dur": 14789.226, + "args": { + "External id": 232333,"Record function id": 0, "Sequence number": 2757773, "Fwd thread id": 1, "Ev Idx": 2444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115681610.197, "dur": 14779.619, + "args": { + "External id": 232334,"Sequence number": 2757773, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2445 + } + }, + { + "ph": "f", "id": 183, "pid": 4183442, "tid": 31331, "ts": 667115681610.197, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115681641.655, "dur": 81.157, + "args": { + "External id": 232335,"Record function id": 0, "Ev Idx": 2446 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115681731.747, "dur": 70.624, + "args": { + "External id": 232336,"Record function id": 0, "Ev Idx": 2447 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.14)", "pid": 4183442, "tid": 31331, + "ts": 667115681808.539, "dur": 14574.223, + "args": { + "External id": 232337,"Record function id": 0, "Ev Idx": 2448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115681900.391, "dur": 7.337, + "args": { + "External id": 232338,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115681918.049, "dur": 5.036, + "args": { + "External id": 232339,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115681938.379, "dur": 13812.175, + "args": { + "External id": 232340,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115681954.369, "dur": 13788.347, + "args": { + "External id": 232341,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115681977.833, "dur": 15.494, + "args": { + "External id": 232342,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115681997.645, "dur": 13708.123, + "args": { + "External id": 232343,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115681999.839, "dur": 13705.144, + "args": { + "External id": 232344,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115682008.020, "dur": 4.903, + "args": { + "External id": 232345,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115682014.582, "dur": 13686.807, + "args": { + "External id": 232346,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115695837.283, "dur": 10.504, + "args": { + "External id": 232347,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115695841.278, "dur": 6.102, + "args": { + "External id": 232348,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115695873.850, "dur": 241.882, + "args": { + "External id": 232349,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115695899.697, "dur": 212.156, + "args": { + "External id": 232350,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2461, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115695911.446, "dur": 195.688, + "args": { + "External id": 232351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115696131.895, "dur": 2.060, + "args": { + "External id": 232352,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2463, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696181.987, "dur": 5.532, + "args": { + "External id": 232353,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696230.185, "dur": 1.276, + "args": { + "External id": 232354,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696247.112, "dur": 1.232, + "args": { + "External id": 232355,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696266.585, "dur": 0.793, + "args": { + "External id": 232356,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696278.424, "dur": 0.759, + "args": { + "External id": 232357,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696288.824, "dur": 0.881, + "args": { + "External id": 232358,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696300.578, "dur": 0.817, + "args": { + "External id": 232359,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696314.855, "dur": 1.803, + "args": { + "External id": 232360,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696326.308, "dur": 0.939, + "args": { + "External id": 232361,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115696411.882, "dur": 2610.123, + "args": { + "External id": 232362,"Record function id": 0, "Ev Idx": 2473 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115696431.727, "dur": 972.389, + "args": { + "External id": 232363,"Record function id": 0, "Ev Idx": 2474 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115696445.766, "dur": 358.906, + "args": { + "External id": 232364,"Record function id": 0, "Ev Idx": 2475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696544.814, "dur": 4.778, + "args": { + "External id": 232365,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696552.681, "dur": 1.176, + "args": { + "External id": 232366,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696556.078, "dur": 1.055, + "args": { + "External id": 232367,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696558.836, "dur": 2.488, + "args": { + "External id": 232368,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696562.847, "dur": 1.016, + "args": { + "External id": 232369,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696565.240, "dur": 0.898, + "args": { + "External id": 232370,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696567.623, "dur": 1.485, + "args": { + "External id": 232371,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696570.347, "dur": 0.935, + "args": { + "External id": 232372,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696572.803, "dur": 0.799, + "args": { + "External id": 232373,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115696575.194, "dur": 0.911, + "args": { + "External id": 232374,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115696593.976, "dur": 178.319, + "args": { + "External id": 232375,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115696613.762, "dur": 153.906, + "args": { + "External id": 232376,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115696627.267, "dur": 12.726, + "args": { + "External id": 232377,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115696642.646, "dur": 99.495, + "args": { + "External id": 232378,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115696645.220, "dur": 96.483, + "args": { + "External id": 232379,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696649.190, "dur": 41.792, + "args": { + "External id": 232380,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115696693.877, "dur": 47.163, + "args": { + "External id": 232381,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2492 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.12", "pid": 4183442, "tid": 31331, + "ts": 667115696891.858, "dur": 505.520, + "args": { + "External id": 232382,"Record function id": 0, "Ev Idx": 2493 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115696907.572, "dur": 476.812, + "args": { + "External id": 232383,"Record function id": 0, "Ev Idx": 2494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115696968.219, "dur": 4.804, + "args": { + "External id": 232384,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115696987.874, "dur": 28.081, + "args": { + "External id": 232385,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696992.520, "dur": 1.606, + "args": { + "External id": 232386,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696996.370, "dur": 0.553, + "args": { + "External id": 232387,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115696998.103, "dur": 0.504, + "args": { + "External id": 232388,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697000.284, "dur": 0.487, + "args": { + "External id": 232389,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697001.860, "dur": 0.283, + "args": { + "External id": 232390,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697003.739, "dur": 0.504, + "args": { + "External id": 232391,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697005.564, "dur": 1.764, + "args": { + "External id": 232392,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697009.325, "dur": 0.664, + "args": { + "External id": 232393,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697011.106, "dur": 0.535, + "args": { + "External id": 232394,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115697026.154, "dur": 28.877, + "args": { + "External id": 232395,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115697083.990, "dur": 90.189, + "args": { + "External id": 232396,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115697093.727, "dur": 2.778, + "args": { + "External id": 232397,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115697101.238, "dur": 10.473, + "args": { + "External id": 232398,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115697105.473, "dur": 5.829, + "args": { + "External id": 232399,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697109.697, "dur": 0.500, + "args": { + "External id": 232400,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115697118.126, "dur": 21.131, + "args": { + "External id": 232401,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697120.265, "dur": 0.445, + "args": { + "External id": 232402,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697122.169, "dur": 0.370, + "args": { + "External id": 232403,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697123.566, "dur": 0.421, + "args": { + "External id": 232404,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697125.515, "dur": 1.864, + "args": { + "External id": 232405,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697128.508, "dur": 0.408, + "args": { + "External id": 232406,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697130.526, "dur": 0.584, + "args": { + "External id": 232407,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697131.819, "dur": 0.363, + "args": { + "External id": 232408,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697133.510, "dur": 0.345, + "args": { + "External id": 232409,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115697135.052, "dur": 0.364, + "args": { + "External id": 232410,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115697148.963, "dur": 18.147, + "args": { + "External id": 232411,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115697219.513, "dur": 104.601, + "args": { + "External id": 232412,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115697239.228, "dur": 81.647, + "args": { + "External id": 232413,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2524, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115697248.228, "dur": 68.608, + "args": { + "External id": 232414,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115697335.902, "dur": 1.962, + "args": { + "External id": 232415,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2526, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115697410.882, "dur": 1586.620, + "args": { + "External id": 232416,"Sequence number": 2757772, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2527 + } + }, + { + "ph": "f", "id": 184, "pid": 4183442, "tid": 31331, "ts": 667115697410.882, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115697538.906, "dur": 98.178, + "args": { + "External id": 232417,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115697716.431, "dur": 39.268, + "args": { + "External id": 232418,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115697774.686, "dur": 44.316, + "args": { + "External id": 232419,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115697828.309, "dur": 25.922, + "args": { + "External id": 232420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115697862.278, "dur": 33.205, + "args": { + "External id": 232421,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115697902.009, "dur": 20.286, + "args": { + "External id": 232422,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115697928.580, "dur": 28.585, + "args": { + "External id": 232423,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115697979.244, "dur": 20.343, + "args": { + "External id": 232424,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115698016.914, "dur": 25.429, + "args": { + "External id": 232425,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115698058.504, "dur": 17.340, + "args": { + "External id": 232426,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115698087.026, "dur": 13.797, + "args": { + "External id": 232427,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698108.906, "dur": 35.350, + "args": { + "External id": 232428,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698147.307, "dur": 30.022, + "args": { + "External id": 232429,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115698203.627, "dur": 166.603, + "args": { + "External id": 232430,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115698274.479, "dur": 5.643, + "args": { + "External id": 232431,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115698285.152, "dur": 2.178, + "args": { + "External id": 232432,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115698401.218, "dur": 24.208, + "args": { + "External id": 232433,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115698435.136, "dur": 18.509, + "args": { + "External id": 232434,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698461.145, "dur": 63.217, + "args": { + "External id": 232435,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698532.463, "dur": 34.309, + "args": { + "External id": 232436,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698574.824, "dur": 31.905, + "args": { + "External id": 232437,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698611.082, "dur": 28.005, + "args": { + "External id": 232438,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698644.308, "dur": 65.640, + "args": { + "External id": 232439,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115698720.378, "dur": 32.703, + "args": { + "External id": 232440,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115698773.285, "dur": 25.159, + "args": { + "External id": 232441,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115698821.386, "dur": 39.641, + "args": { + "External id": 232442,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115698887.243, "dur": 20.872, + "args": { + "External id": 232443,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115698925.560, "dur": 15.153, + "args": { + "External id": 232444,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115698953.249, "dur": 16.760, + "args": { + "External id": 232445,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699043.163, "dur": 37.167, + "args": { + "External id": 232446,"Record function id": 0, "Ev Idx": 2557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699046.554, "dur": 32.882, + "args": { + "External id": 232447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699050.531, "dur": 27.805, + "args": { + "External id": 232448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699074.165, "dur": 4.072, + "args": { + "External id": 232449,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699084.273, "dur": 4.214, + "args": { + "External id": 232450,"Record function id": 0, "Ev Idx": 2561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699085.526, "dur": 2.537, + "args": { + "External id": 232451,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699086.418, "dur": 1.043, + "args": { + "External id": 232452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699086.772, "dur": 0.564, + "args": { + "External id": 232453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699091.708, "dur": 5.938, + "args": { + "External id": 232454,"Record function id": 0, "Ev Idx": 2565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699092.739, "dur": 4.508, + "args": { + "External id": 232455,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699093.614, "dur": 3.202, + "args": { + "External id": 232456,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699093.973, "dur": 2.727, + "args": { + "External id": 232457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699100.799, "dur": 3.631, + "args": { + "External id": 232458,"Record function id": 0, "Ev Idx": 2569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699101.982, "dur": 2.011, + "args": { + "External id": 232459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699102.628, "dur": 0.919, + "args": { + "External id": 232460,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699102.940, "dur": 0.513, + "args": { + "External id": 232461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699107.492, "dur": 3.781, + "args": { + "External id": 232462,"Record function id": 0, "Ev Idx": 2573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699108.419, "dur": 2.442, + "args": { + "External id": 232463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699108.895, "dur": 1.508, + "args": { + "External id": 232464,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699109.618, "dur": 0.712, + "args": { + "External id": 232465,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699114.368, "dur": 4.126, + "args": { + "External id": 232466,"Record function id": 0, "Ev Idx": 2577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699115.362, "dur": 2.736, + "args": { + "External id": 232467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699116.263, "dur": 1.407, + "args": { + "External id": 232468,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699116.937, "dur": 0.628, + "args": { + "External id": 232469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699121.881, "dur": 4.446, + "args": { + "External id": 232470,"Record function id": 0, "Ev Idx": 2581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699123.185, "dur": 2.754, + "args": { + "External id": 232471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699124.097, "dur": 1.317, + "args": { + "External id": 232472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699124.694, "dur": 0.656, + "args": { + "External id": 232473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699129.894, "dur": 4.197, + "args": { + "External id": 232474,"Record function id": 0, "Ev Idx": 2585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699130.874, "dur": 2.821, + "args": { + "External id": 232475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699131.704, "dur": 1.566, + "args": { + "External id": 232476,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699132.611, "dur": 0.584, + "args": { + "External id": 232477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699137.311, "dur": 3.979, + "args": { + "External id": 232478,"Record function id": 0, "Ev Idx": 2589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115699138.425, "dur": 2.476, + "args": { + "External id": 232479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115699139.259, "dur": 1.224, + "args": { + "External id": 232480,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115699139.851, "dur": 0.527, + "args": { + "External id": 232481,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115699145.237, "dur": 14915.933, + "args": { + "External id": 232482,"Record function id": 0, "Sequence number": 2757771, "Fwd thread id": 1, "Ev Idx": 2593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115699146.640, "dur": 14905.381, + "args": { + "External id": 232483,"Sequence number": 2757771, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2594 + } + }, + { + "ph": "f", "id": 185, "pid": 4183442, "tid": 31331, "ts": 667115699146.640, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115699175.858, "dur": 41.333, + "args": { + "External id": 232484,"Record function id": 0, "Ev Idx": 2595 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115699224.489, "dur": 71.975, + "args": { + "External id": 232485,"Record function id": 0, "Ev Idx": 2596 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.13)", "pid": 4183442, "tid": 31331, + "ts": 667115699302.917, "dur": 14741.991, + "args": { + "External id": 232486,"Record function id": 0, "Ev Idx": 2597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115699389.910, "dur": 7.004, + "args": { + "External id": 232487,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115699406.352, "dur": 6.279, + "args": { + "External id": 232488,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115699427.024, "dur": 13879.347, + "args": { + "External id": 232489,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115699439.925, "dur": 13858.283, + "args": { + "External id": 232490,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115699463.367, "dur": 13.388, + "args": { + "External id": 232491,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115699480.877, "dur": 13782.905, + "args": { + "External id": 232492,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115699482.973, "dur": 13779.987, + "args": { + "External id": 232493,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115699486.876, "dur": 23.378, + "args": { + "External id": 232494,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115699512.847, "dur": 13746.602, + "args": { + "External id": 232495,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115713392.052, "dur": 8.685, + "args": { + "External id": 232496,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115713394.892, "dur": 5.530, + "args": { + "External id": 232497,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115713426.910, "dur": 338.025, + "args": { + "External id": 232498,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115713453.822, "dur": 306.349, + "args": { + "External id": 232499,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2610, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115713464.655, "dur": 290.152, + "args": { + "External id": 232500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115713785.323, "dur": 2.330, + "args": { + "External id": 232501,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2612, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713842.704, "dur": 6.188, + "args": { + "External id": 232502,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713894.576, "dur": 1.356, + "args": { + "External id": 232503,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713911.460, "dur": 2.874, + "args": { + "External id": 232504,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713925.781, "dur": 0.860, + "args": { + "External id": 232505,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713937.940, "dur": 1.062, + "args": { + "External id": 232506,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713948.748, "dur": 0.810, + "args": { + "External id": 232507,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713959.683, "dur": 2.786, + "args": { + "External id": 232508,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713973.216, "dur": 2.323, + "args": { + "External id": 232509,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115713986.048, "dur": 0.667, + "args": { + "External id": 232510,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115714075.821, "dur": 2629.803, + "args": { + "External id": 232511,"Record function id": 0, "Ev Idx": 2622 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115714095.219, "dur": 974.386, + "args": { + "External id": 232512,"Record function id": 0, "Ev Idx": 2623 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115714111.192, "dur": 285.598, + "args": { + "External id": 232513,"Record function id": 0, "Ev Idx": 2624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714190.993, "dur": 3.973, + "args": { + "External id": 232514,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714197.883, "dur": 1.061, + "args": { + "External id": 232515,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714200.873, "dur": 2.504, + "args": { + "External id": 232516,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714205.027, "dur": 0.992, + "args": { + "External id": 232517,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714207.774, "dur": 0.755, + "args": { + "External id": 232518,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714210.207, "dur": 0.656, + "args": { + "External id": 232519,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714212.908, "dur": 1.672, + "args": { + "External id": 232520,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714216.246, "dur": 1.160, + "args": { + "External id": 232521,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714218.903, "dur": 0.908, + "args": { + "External id": 232522,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115714221.105, "dur": 1.002, + "args": { + "External id": 232523,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115714238.766, "dur": 133.296, + "args": { + "External id": 232524,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115714253.815, "dur": 114.268, + "args": { + "External id": 232525,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115714265.873, "dur": 14.693, + "args": { + "External id": 232526,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115714283.287, "dur": 59.131, + "args": { + "External id": 232527,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115714286.524, "dur": 55.628, + "args": { + "External id": 232528,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714290.176, "dur": 4.910, + "args": { + "External id": 232529,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115714296.856, "dur": 44.619, + "args": { + "External id": 232530,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2641 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.11", "pid": 4183442, "tid": 31331, + "ts": 667115714476.431, "dur": 585.918, + "args": { + "External id": 232531,"Record function id": 0, "Ev Idx": 2642 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115714514.164, "dur": 536.124, + "args": { + "External id": 232532,"Record function id": 0, "Ev Idx": 2643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115714575.560, "dur": 5.830, + "args": { + "External id": 232533,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115714596.192, "dur": 27.654, + "args": { + "External id": 232534,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714601.069, "dur": 1.380, + "args": { + "External id": 232535,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714604.284, "dur": 0.499, + "args": { + "External id": 232536,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714606.222, "dur": 0.416, + "args": { + "External id": 232537,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714607.763, "dur": 0.392, + "args": { + "External id": 232538,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714609.775, "dur": 0.394, + "args": { + "External id": 232539,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714611.633, "dur": 2.253, + "args": { + "External id": 232540,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714615.425, "dur": 0.547, + "args": { + "External id": 232541,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714617.288, "dur": 0.757, + "args": { + "External id": 232542,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714619.370, "dur": 0.238, + "args": { + "External id": 232543,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115714633.476, "dur": 66.095, + "args": { + "External id": 232544,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115714735.498, "dur": 96.088, + "args": { + "External id": 232545,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115714745.713, "dur": 4.229, + "args": { + "External id": 232546,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115714754.780, "dur": 9.801, + "args": { + "External id": 232547,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115714758.830, "dur": 5.323, + "args": { + "External id": 232548,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714762.006, "dur": 0.842, + "args": { + "External id": 232549,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115714771.757, "dur": 22.358, + "args": { + "External id": 232550,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714773.511, "dur": 0.344, + "args": { + "External id": 232551,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714775.455, "dur": 0.476, + "args": { + "External id": 232552,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714777.234, "dur": 1.913, + "args": { + "External id": 232553,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714780.485, "dur": 0.614, + "args": { + "External id": 232554,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714782.511, "dur": 0.323, + "args": { + "External id": 232555,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714783.945, "dur": 1.483, + "args": { + "External id": 232556,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714786.974, "dur": 0.386, + "args": { + "External id": 232557,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714788.635, "dur": 0.434, + "args": { + "External id": 232558,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115714790.447, "dur": 0.280, + "args": { + "External id": 232559,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115714805.454, "dur": 18.632, + "args": { + "External id": 232560,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115714875.194, "dur": 110.553, + "args": { + "External id": 232561,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115714899.110, "dur": 83.468, + "args": { + "External id": 232562,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2673, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115714908.541, "dur": 69.425, + "args": { + "External id": 232563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115715000.593, "dur": 2.029, + "args": { + "External id": 232564,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2675, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115715078.054, "dur": 1567.061, + "args": { + "External id": 232565,"Sequence number": 2757770, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2676 + } + }, + { + "ph": "f", "id": 186, "pid": 4183442, "tid": 31331, "ts": 667115715078.054, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715187.543, "dur": 99.596, + "args": { + "External id": 232566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115715326.613, "dur": 43.792, + "args": { + "External id": 232567,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115715388.033, "dur": 41.254, + "args": { + "External id": 232568,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715439.332, "dur": 27.422, + "args": { + "External id": 232569,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715472.636, "dur": 53.275, + "args": { + "External id": 232570,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715535.909, "dur": 24.376, + "args": { + "External id": 232571,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715567.844, "dur": 29.189, + "args": { + "External id": 232572,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115715625.408, "dur": 22.031, + "args": { + "External id": 232573,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115715704.416, "dur": 28.414, + "args": { + "External id": 232574,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115715754.387, "dur": 17.324, + "args": { + "External id": 232575,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115715786.179, "dur": 14.215, + "args": { + "External id": 232576,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715809.947, "dur": 41.010, + "args": { + "External id": 232577,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115715854.736, "dur": 30.046, + "args": { + "External id": 232578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115715916.036, "dur": 172.385, + "args": { + "External id": 232579,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115715992.208, "dur": 6.155, + "args": { + "External id": 232580,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115716000.317, "dur": 3.473, + "args": { + "External id": 232581,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115716121.259, "dur": 22.605, + "args": { + "External id": 232582,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115716157.438, "dur": 12.676, + "args": { + "External id": 232583,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716177.956, "dur": 42.905, + "args": { + "External id": 232584,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716226.389, "dur": 30.133, + "args": { + "External id": 232585,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716264.337, "dur": 27.840, + "args": { + "External id": 232586,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716296.813, "dur": 28.017, + "args": { + "External id": 232587,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716330.833, "dur": 29.942, + "args": { + "External id": 232588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115716367.121, "dur": 27.569, + "args": { + "External id": 232589,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115716417.394, "dur": 20.763, + "args": { + "External id": 232590,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115716454.903, "dur": 30.241, + "args": { + "External id": 232591,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115716525.377, "dur": 25.309, + "args": { + "External id": 232592,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115716567.209, "dur": 16.475, + "args": { + "External id": 232593,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115716595.717, "dur": 21.442, + "args": { + "External id": 232594,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716728.937, "dur": 15.008, + "args": { + "External id": 232595,"Record function id": 0, "Ev Idx": 2706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716732.244, "dur": 10.808, + "args": { + "External id": 232596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716736.619, "dur": 5.490, + "args": { + "External id": 232597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716738.172, "dur": 3.838, + "args": { + "External id": 232598,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716748.000, "dur": 6.828, + "args": { + "External id": 232599,"Record function id": 0, "Ev Idx": 2710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716749.590, "dur": 4.804, + "args": { + "External id": 232600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716750.371, "dur": 3.285, + "args": { + "External id": 232601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716751.036, "dur": 2.528, + "args": { + "External id": 232602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716758.266, "dur": 5.119, + "args": { + "External id": 232603,"Record function id": 0, "Ev Idx": 2714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716760.143, "dur": 2.804, + "args": { + "External id": 232604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716760.819, "dur": 1.717, + "args": { + "External id": 232605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716761.515, "dur": 0.928, + "args": { + "External id": 232606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716766.595, "dur": 4.184, + "args": { + "External id": 232607,"Record function id": 0, "Ev Idx": 2718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716768.135, "dur": 2.203, + "args": { + "External id": 232608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716768.842, "dur": 1.033, + "args": { + "External id": 232609,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716769.125, "dur": 0.676, + "args": { + "External id": 232610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716773.889, "dur": 4.187, + "args": { + "External id": 232611,"Record function id": 0, "Ev Idx": 2722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716774.897, "dur": 2.685, + "args": { + "External id": 232612,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716775.582, "dur": 1.568, + "args": { + "External id": 232613,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716776.141, "dur": 0.941, + "args": { + "External id": 232614,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716781.412, "dur": 4.575, + "args": { + "External id": 232615,"Record function id": 0, "Ev Idx": 2726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716782.568, "dur": 3.011, + "args": { + "External id": 232616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716783.385, "dur": 1.661, + "args": { + "External id": 232617,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716784.298, "dur": 0.681, + "args": { + "External id": 232618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716789.243, "dur": 4.229, + "args": { + "External id": 232619,"Record function id": 0, "Ev Idx": 2730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716790.695, "dur": 2.373, + "args": { + "External id": 232620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716791.179, "dur": 1.307, + "args": { + "External id": 232621,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716791.812, "dur": 0.608, + "args": { + "External id": 232622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716796.848, "dur": 3.586, + "args": { + "External id": 232623,"Record function id": 0, "Ev Idx": 2734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716797.952, "dur": 2.091, + "args": { + "External id": 232624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716798.481, "dur": 1.141, + "args": { + "External id": 232625,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716798.970, "dur": 0.589, + "args": { + "External id": 232626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716803.730, "dur": 5.632, + "args": { + "External id": 232627,"Record function id": 0, "Ev Idx": 2738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115716804.985, "dur": 3.955, + "args": { + "External id": 232628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115716805.639, "dur": 2.874, + "args": { + "External id": 232629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115716806.168, "dur": 2.277, + "args": { + "External id": 232630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115716813.228, "dur": 14769.376, + "args": { + "External id": 232631,"Record function id": 0, "Sequence number": 2757769, "Fwd thread id": 1, "Ev Idx": 2742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115716814.592, "dur": 14759.646, + "args": { + "External id": 232632,"Sequence number": 2757769, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2743 + } + }, + { + "ph": "f", "id": 187, "pid": 4183442, "tid": 31331, "ts": 667115716814.592, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115716845.765, "dur": 37.680, + "args": { + "External id": 232633,"Record function id": 0, "Ev Idx": 2744 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115716890.683, "dur": 67.517, + "args": { + "External id": 232634,"Record function id": 0, "Ev Idx": 2745 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.12)", "pid": 4183442, "tid": 31331, + "ts": 667115716967.796, "dur": 14598.268, + "args": { + "External id": 232635,"Record function id": 0, "Ev Idx": 2746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115717053.507, "dur": 10.112, + "args": { + "External id": 232636,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115717072.256, "dur": 4.947, + "args": { + "External id": 232637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115717090.789, "dur": 13820.589, + "args": { + "External id": 232638,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115717104.068, "dur": 13799.533, + "args": { + "External id": 232639,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115717134.892, "dur": 14.001, + "args": { + "External id": 232640,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115717152.778, "dur": 13716.155, + "args": { + "External id": 232641,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115717155.173, "dur": 13713.025, + "args": { + "External id": 232642,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115717159.560, "dur": 4.772, + "args": { + "External id": 232643,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115717165.967, "dur": 13698.898, + "args": { + "External id": 232644,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115730998.500, "dur": 8.778, + "args": { + "External id": 232645,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115731001.337, "dur": 5.594, + "args": { + "External id": 232646,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115731036.806, "dur": 243.344, + "args": { + "External id": 232647,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115731064.242, "dur": 211.953, + "args": { + "External id": 232648,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2759, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115731074.891, "dur": 196.851, + "args": { + "External id": 232649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115731296.575, "dur": 1.839, + "args": { + "External id": 232650,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2761, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731347.008, "dur": 5.900, + "args": { + "External id": 232651,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731395.044, "dur": 3.095, + "args": { + "External id": 232652,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731412.734, "dur": 1.339, + "args": { + "External id": 232653,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731425.644, "dur": 1.062, + "args": { + "External id": 232654,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731437.352, "dur": 0.881, + "args": { + "External id": 232655,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731448.729, "dur": 2.165, + "args": { + "External id": 232656,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731461.817, "dur": 0.660, + "args": { + "External id": 232657,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731474.099, "dur": 1.651, + "args": { + "External id": 232658,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731484.524, "dur": 0.895, + "args": { + "External id": 232659,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115731598.025, "dur": 2600.711, + "args": { + "External id": 232660,"Record function id": 0, "Ev Idx": 2771 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115731618.853, "dur": 957.640, + "args": { + "External id": 232661,"Record function id": 0, "Ev Idx": 2772 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115731633.182, "dur": 341.137, + "args": { + "External id": 232662,"Record function id": 0, "Ev Idx": 2773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731756.209, "dur": 6.267, + "args": { + "External id": 232663,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731765.888, "dur": 0.945, + "args": { + "External id": 232664,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731768.383, "dur": 1.056, + "args": { + "External id": 232665,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731771.086, "dur": 1.000, + "args": { + "External id": 232666,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731773.537, "dur": 1.137, + "args": { + "External id": 232667,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731777.237, "dur": 0.918, + "args": { + "External id": 232668,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731779.861, "dur": 1.300, + "args": { + "External id": 232669,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731782.581, "dur": 0.934, + "args": { + "External id": 232670,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731784.863, "dur": 2.189, + "args": { + "External id": 232671,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115731788.358, "dur": 0.842, + "args": { + "External id": 232672,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115731807.820, "dur": 137.603, + "args": { + "External id": 232673,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115731823.050, "dur": 118.324, + "args": { + "External id": 232674,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115731836.196, "dur": 13.183, + "args": { + "External id": 232675,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115731852.002, "dur": 62.087, + "args": { + "External id": 232676,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115731854.739, "dur": 59.053, + "args": { + "External id": 232677,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115731858.639, "dur": 6.066, + "args": { + "External id": 232678,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115731866.322, "dur": 46.943, + "args": { + "External id": 232679,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2790 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.10", "pid": 4183442, "tid": 31331, + "ts": 667115732059.332, "dur": 509.779, + "args": { + "External id": 232680,"Record function id": 0, "Ev Idx": 2791 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115732075.175, "dur": 482.639, + "args": { + "External id": 232681,"Record function id": 0, "Ev Idx": 2792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115732130.344, "dur": 4.061, + "args": { + "External id": 232682,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115732148.435, "dur": 27.786, + "args": { + "External id": 232683,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732153.053, "dur": 1.585, + "args": { + "External id": 232684,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732156.461, "dur": 0.731, + "args": { + "External id": 232685,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732158.093, "dur": 1.494, + "args": { + "External id": 232686,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732160.302, "dur": 2.295, + "args": { + "External id": 232687,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732163.631, "dur": 0.255, + "args": { + "External id": 232688,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732165.844, "dur": 0.310, + "args": { + "External id": 232689,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732167.177, "dur": 0.562, + "args": { + "External id": 232690,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732168.399, "dur": 0.627, + "args": { + "External id": 232691,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732171.717, "dur": 0.684, + "args": { + "External id": 232692,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115732185.414, "dur": 26.766, + "args": { + "External id": 232693,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115732240.988, "dur": 87.302, + "args": { + "External id": 232694,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115732249.714, "dur": 3.311, + "args": { + "External id": 232695,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115732257.595, "dur": 9.217, + "args": { + "External id": 232696,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115732261.624, "dur": 4.803, + "args": { + "External id": 232697,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732264.812, "dur": 0.595, + "args": { + "External id": 232698,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115732273.052, "dur": 22.771, + "args": { + "External id": 232699,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732274.757, "dur": 1.922, + "args": { + "External id": 232700,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732277.881, "dur": 0.544, + "args": { + "External id": 232701,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732279.938, "dur": 0.748, + "args": { + "External id": 232702,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732281.598, "dur": 0.250, + "args": { + "External id": 232703,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732283.124, "dur": 0.841, + "args": { + "External id": 232704,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732285.130, "dur": 0.433, + "args": { + "External id": 232705,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732286.698, "dur": 0.356, + "args": { + "External id": 232706,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732288.516, "dur": 0.544, + "args": { + "External id": 232707,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115732290.756, "dur": 2.013, + "args": { + "External id": 232708,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115732305.014, "dur": 16.253, + "args": { + "External id": 232709,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115732368.709, "dur": 105.297, + "args": { + "External id": 232710,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115732391.360, "dur": 79.039, + "args": { + "External id": 232711,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2822, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115732399.872, "dur": 66.769, + "args": { + "External id": 232712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115732487.696, "dur": 2.077, + "args": { + "External id": 232713,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2824, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115732583.681, "dur": 1593.257, + "args": { + "External id": 232714,"Sequence number": 2757768, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2825 + } + }, + { + "ph": "f", "id": 188, "pid": 4183442, "tid": 31331, "ts": 667115732583.681, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115732731.424, "dur": 101.518, + "args": { + "External id": 232715,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115732874.564, "dur": 38.681, + "args": { + "External id": 232716,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115732931.843, "dur": 40.307, + "args": { + "External id": 232717,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115732981.006, "dur": 27.228, + "args": { + "External id": 232718,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733014.489, "dur": 34.270, + "args": { + "External id": 232719,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733055.617, "dur": 21.682, + "args": { + "External id": 232720,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733086.289, "dur": 29.356, + "args": { + "External id": 232721,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115733138.258, "dur": 22.938, + "args": { + "External id": 232722,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115733177.886, "dur": 26.814, + "args": { + "External id": 232723,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115733222.392, "dur": 19.741, + "args": { + "External id": 232724,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115733254.713, "dur": 16.233, + "args": { + "External id": 232725,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733280.483, "dur": 37.725, + "args": { + "External id": 232726,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733321.264, "dur": 30.207, + "args": { + "External id": 232727,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115733376.775, "dur": 175.036, + "args": { + "External id": 232728,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115733445.678, "dur": 5.860, + "args": { + "External id": 232729,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115733453.676, "dur": 2.834, + "args": { + "External id": 232730,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115733583.825, "dur": 29.564, + "args": { + "External id": 232731,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115733628.485, "dur": 15.144, + "args": { + "External id": 232732,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733694.661, "dur": 60.097, + "args": { + "External id": 232733,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733764.063, "dur": 32.251, + "args": { + "External id": 232734,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733807.015, "dur": 28.038, + "args": { + "External id": 232735,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733839.430, "dur": 29.826, + "args": { + "External id": 232736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733874.596, "dur": 27.681, + "args": { + "External id": 232737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115733910.667, "dur": 30.726, + "args": { + "External id": 232738,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115733958.782, "dur": 40.065, + "args": { + "External id": 232739,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115734022.098, "dur": 30.159, + "args": { + "External id": 232740,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115734066.761, "dur": 18.154, + "args": { + "External id": 232741,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115734099.425, "dur": 17.462, + "args": { + "External id": 232742,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115734129.986, "dur": 15.926, + "args": { + "External id": 232743,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734219.789, "dur": 16.079, + "args": { + "External id": 232744,"Record function id": 0, "Ev Idx": 2855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734223.134, "dur": 11.934, + "args": { + "External id": 232745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734227.316, "dur": 6.958, + "args": { + "External id": 232746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734228.778, "dur": 5.390, + "args": { + "External id": 232747,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734240.018, "dur": 5.220, + "args": { + "External id": 232748,"Record function id": 0, "Ev Idx": 2859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734241.878, "dur": 2.886, + "args": { + "External id": 232749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734242.725, "dur": 1.539, + "args": { + "External id": 232750,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734243.467, "dur": 0.731, + "args": { + "External id": 232751,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734248.731, "dur": 4.523, + "args": { + "External id": 232752,"Record function id": 0, "Ev Idx": 2863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734250.013, "dur": 2.787, + "args": { + "External id": 232753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734250.861, "dur": 1.500, + "args": { + "External id": 232754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734251.461, "dur": 0.815, + "args": { + "External id": 232755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734256.458, "dur": 5.015, + "args": { + "External id": 232756,"Record function id": 0, "Ev Idx": 2867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734257.914, "dur": 3.119, + "args": { + "External id": 232757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734258.651, "dur": 1.746, + "args": { + "External id": 232758,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734259.716, "dur": 0.606, + "args": { + "External id": 232759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734264.593, "dur": 4.067, + "args": { + "External id": 232760,"Record function id": 0, "Ev Idx": 2871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734265.897, "dur": 2.336, + "args": { + "External id": 232761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734266.402, "dur": 1.385, + "args": { + "External id": 232762,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734267.075, "dur": 0.624, + "args": { + "External id": 232763,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734272.070, "dur": 4.563, + "args": { + "External id": 232764,"Record function id": 0, "Ev Idx": 2875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734273.285, "dur": 2.925, + "args": { + "External id": 232765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734274.000, "dur": 1.809, + "args": { + "External id": 232766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734274.873, "dur": 0.870, + "args": { + "External id": 232767,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734279.751, "dur": 3.715, + "args": { + "External id": 232768,"Record function id": 0, "Ev Idx": 2879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734280.877, "dur": 2.182, + "args": { + "External id": 232769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734281.553, "dur": 1.091, + "args": { + "External id": 232770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734281.953, "dur": 0.621, + "args": { + "External id": 232771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734286.889, "dur": 5.675, + "args": { + "External id": 232772,"Record function id": 0, "Ev Idx": 2883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734288.209, "dur": 3.944, + "args": { + "External id": 232773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734288.703, "dur": 3.031, + "args": { + "External id": 232774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734289.256, "dur": 2.379, + "args": { + "External id": 232775,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734295.979, "dur": 4.162, + "args": { + "External id": 232776,"Record function id": 0, "Ev Idx": 2887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115734297.534, "dur": 2.186, + "args": { + "External id": 232777,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115734298.057, "dur": 1.251, + "args": { + "External id": 232778,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115734298.516, "dur": 0.695, + "args": { + "External id": 232779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115734304.416, "dur": 14964.123, + "args": { + "External id": 232780,"Record function id": 0, "Sequence number": 2757767, "Fwd thread id": 1, "Ev Idx": 2891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115734306.035, "dur": 14953.345, + "args": { + "External id": 232781,"Sequence number": 2757767, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2892 + } + }, + { + "ph": "f", "id": 189, "pid": 4183442, "tid": 31331, "ts": 667115734306.035, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115734335.834, "dur": 38.228, + "args": { + "External id": 232782,"Record function id": 0, "Ev Idx": 2893 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115734381.398, "dur": 64.458, + "args": { + "External id": 232783,"Record function id": 0, "Ev Idx": 2894 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.11)", "pid": 4183442, "tid": 31331, + "ts": 667115734455.054, "dur": 14796.956, + "args": { + "External id": 232784,"Record function id": 0, "Ev Idx": 2895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115734560.279, "dur": 7.702, + "args": { + "External id": 232785,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115734578.033, "dur": 5.364, + "args": { + "External id": 232786,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115734597.691, "dur": 13989.175, + "args": { + "External id": 232787,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115734610.877, "dur": 13967.582, + "args": { + "External id": 232788,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115734634.218, "dur": 14.184, + "args": { + "External id": 232789,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115734688.152, "dur": 13857.160, + "args": { + "External id": 232790,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115734690.542, "dur": 13854.163, + "args": { + "External id": 232791,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115734694.484, "dur": 6.013, + "args": { + "External id": 232792,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115734702.204, "dur": 13839.233, + "args": { + "External id": 232793,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115748699.728, "dur": 9.286, + "args": { + "External id": 232794,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115748702.551, "dur": 5.911, + "args": { + "External id": 232795,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115748736.827, "dur": 249.079, + "args": { + "External id": 232796,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115748762.883, "dur": 218.834, + "args": { + "External id": 232797,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2908, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115748774.090, "dur": 203.157, + "args": { + "External id": 232798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115749002.639, "dur": 1.719, + "args": { + "External id": 232799,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2910, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749054.542, "dur": 5.316, + "args": { + "External id": 232800,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749103.714, "dur": 1.233, + "args": { + "External id": 232801,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749120.452, "dur": 1.165, + "args": { + "External id": 232802,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749133.644, "dur": 0.780, + "args": { + "External id": 232803,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749145.515, "dur": 0.964, + "args": { + "External id": 232804,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749157.246, "dur": 1.110, + "args": { + "External id": 232805,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749168.661, "dur": 0.893, + "args": { + "External id": 232806,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749179.826, "dur": 1.795, + "args": { + "External id": 232807,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749191.388, "dur": 0.647, + "args": { + "External id": 232808,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115749281.959, "dur": 2638.736, + "args": { + "External id": 232809,"Record function id": 0, "Ev Idx": 2920 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115749301.840, "dur": 978.077, + "args": { + "External id": 232810,"Record function id": 0, "Ev Idx": 2921 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115749316.157, "dur": 309.137, + "args": { + "External id": 232811,"Record function id": 0, "Ev Idx": 2922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749392.761, "dur": 4.126, + "args": { + "External id": 232812,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749399.717, "dur": 1.353, + "args": { + "External id": 232813,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749402.913, "dur": 0.971, + "args": { + "External id": 232814,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749405.738, "dur": 0.833, + "args": { + "External id": 232815,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749408.299, "dur": 1.158, + "args": { + "External id": 232816,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749411.335, "dur": 1.100, + "args": { + "External id": 232817,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749414.550, "dur": 1.478, + "args": { + "External id": 232818,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749417.734, "dur": 2.724, + "args": { + "External id": 232819,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749422.266, "dur": 0.993, + "args": { + "External id": 232820,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115749424.835, "dur": 0.751, + "args": { + "External id": 232821,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115749443.454, "dur": 153.192, + "args": { + "External id": 232822,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115749457.408, "dur": 134.824, + "args": { + "External id": 232823,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115749467.938, "dur": 13.952, + "args": { + "External id": 232824,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115749484.558, "dur": 81.168, + "args": { + "External id": 232825,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115749487.241, "dur": 78.127, + "args": { + "External id": 232826,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749509.381, "dur": 7.198, + "args": { + "External id": 232827,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115749519.082, "dur": 45.625, + "args": { + "External id": 232828,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2939 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.9", "pid": 4183442, "tid": 31331, + "ts": 667115749751.573, "dur": 521.115, + "args": { + "External id": 232829,"Record function id": 0, "Ev Idx": 2940 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115749767.747, "dur": 493.136, + "args": { + "External id": 232830,"Record function id": 0, "Ev Idx": 2941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115749827.655, "dur": 5.502, + "args": { + "External id": 232831,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115749847.197, "dur": 29.995, + "args": { + "External id": 232832,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749852.301, "dur": 1.692, + "args": { + "External id": 232833,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749856.077, "dur": 0.582, + "args": { + "External id": 232834,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749858.103, "dur": 2.089, + "args": { + "External id": 232835,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749861.673, "dur": 0.370, + "args": { + "External id": 232836,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749863.555, "dur": 0.961, + "args": { + "External id": 232837,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749865.863, "dur": 0.568, + "args": { + "External id": 232838,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749869.098, "dur": 0.634, + "args": { + "External id": 232839,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749870.525, "dur": 0.725, + "args": { + "External id": 232840,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749872.598, "dur": 0.708, + "args": { + "External id": 232841,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115749887.436, "dur": 30.613, + "args": { + "External id": 232842,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115749949.011, "dur": 96.620, + "args": { + "External id": 232843,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115749958.360, "dur": 2.874, + "args": { + "External id": 232844,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115749966.163, "dur": 11.244, + "args": { + "External id": 232845,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115749970.383, "dur": 6.606, + "args": { + "External id": 232846,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749973.751, "dur": 2.203, + "args": { + "External id": 232847,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115749984.038, "dur": 21.215, + "args": { + "External id": 232848,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749985.709, "dur": 0.660, + "args": { + "External id": 232849,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749987.743, "dur": 0.524, + "args": { + "External id": 232850,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749989.862, "dur": 0.470, + "args": { + "External id": 232851,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749991.632, "dur": 0.307, + "args": { + "External id": 232852,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749993.708, "dur": 0.265, + "args": { + "External id": 232853,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749995.086, "dur": 0.554, + "args": { + "External id": 232854,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749997.112, "dur": 0.312, + "args": { + "External id": 232855,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115749998.693, "dur": 1.944, + "args": { + "External id": 232856,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115750001.751, "dur": 0.318, + "args": { + "External id": 232857,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115750019.554, "dur": 18.238, + "args": { + "External id": 232858,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115750089.494, "dur": 107.268, + "args": { + "External id": 232859,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115750111.578, "dur": 81.812, + "args": { + "External id": 232860,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2971, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115750120.968, "dur": 68.419, + "args": { + "External id": 232861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115750211.255, "dur": 1.803, + "args": { + "External id": 232862,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2973, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115750286.713, "dur": 1611.928, + "args": { + "External id": 232863,"Sequence number": 2757766, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2974 + } + }, + { + "ph": "f", "id": 190, "pid": 4183442, "tid": 31331, "ts": 667115750286.713, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115750393.942, "dur": 116.875, + "args": { + "External id": 232864,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115750551.361, "dur": 40.086, + "args": { + "External id": 232865,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115750610.508, "dur": 81.359, + "args": { + "External id": 232866,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115750706.289, "dur": 32.511, + "args": { + "External id": 232867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115750745.325, "dur": 34.983, + "args": { + "External id": 232868,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115750787.072, "dur": 22.490, + "args": { + "External id": 232869,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115750818.706, "dur": 27.974, + "args": { + "External id": 232870,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115750871.544, "dur": 23.341, + "args": { + "External id": 232871,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115750914.457, "dur": 26.721, + "args": { + "External id": 232872,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115750958.426, "dur": 18.878, + "args": { + "External id": 232873,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115750989.264, "dur": 14.382, + "args": { + "External id": 232874,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751013.299, "dur": 37.800, + "args": { + "External id": 232875,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751054.207, "dur": 30.430, + "args": { + "External id": 232876,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115751111.115, "dur": 166.359, + "args": { + "External id": 232877,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115751183.971, "dur": 5.562, + "args": { + "External id": 232878,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115751191.286, "dur": 4.478, + "args": { + "External id": 232879,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115751310.467, "dur": 23.643, + "args": { + "External id": 232880,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115751346.484, "dur": 13.198, + "args": { + "External id": 232881,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751368.706, "dur": 40.565, + "args": { + "External id": 232882,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751414.747, "dur": 30.449, + "args": { + "External id": 232883,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751451.617, "dur": 30.719, + "args": { + "External id": 232884,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751486.744, "dur": 47.221, + "args": { + "External id": 232885,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751548.529, "dur": 29.571, + "args": { + "External id": 232886,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115751584.786, "dur": 28.140, + "args": { + "External id": 232887,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115751629.712, "dur": 57.801, + "args": { + "External id": 232888,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115751712.854, "dur": 47.268, + "args": { + "External id": 232889,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115751781.804, "dur": 19.250, + "args": { + "External id": 232890,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115751821.842, "dur": 13.946, + "args": { + "External id": 232891,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115751848.886, "dur": 17.562, + "args": { + "External id": 232892,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751945.316, "dur": 14.939, + "args": { + "External id": 232893,"Record function id": 0, "Ev Idx": 3004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751948.432, "dur": 10.957, + "args": { + "External id": 232894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115751952.687, "dur": 5.856, + "args": { + "External id": 232895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115751954.071, "dur": 4.358, + "args": { + "External id": 232896,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751964.293, "dur": 4.907, + "args": { + "External id": 232897,"Record function id": 0, "Ev Idx": 3008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751965.675, "dur": 3.083, + "args": { + "External id": 232898,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115751966.684, "dur": 1.568, + "args": { + "External id": 232899,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115751967.245, "dur": 0.908, + "args": { + "External id": 232900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751972.426, "dur": 4.091, + "args": { + "External id": 232901,"Record function id": 0, "Ev Idx": 3012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751973.848, "dur": 2.232, + "args": { + "External id": 232902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115751974.476, "dur": 1.120, + "args": { + "External id": 232903,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115751974.887, "dur": 0.629, + "args": { + "External id": 232904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751979.722, "dur": 7.905, + "args": { + "External id": 232905,"Record function id": 0, "Ev Idx": 3016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751981.293, "dur": 3.218, + "args": { + "External id": 232906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115751982.395, "dur": 1.478, + "args": { + "External id": 232907,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115751983.110, "dur": 0.670, + "args": { + "External id": 232908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751990.720, "dur": 4.279, + "args": { + "External id": 232909,"Record function id": 0, "Ev Idx": 3020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751992.007, "dur": 2.575, + "args": { + "External id": 232910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115751992.638, "dur": 1.506, + "args": { + "External id": 232911,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115751993.535, "dur": 0.545, + "args": { + "External id": 232912,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751998.203, "dur": 4.848, + "args": { + "External id": 232913,"Record function id": 0, "Ev Idx": 3024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115751999.615, "dur": 3.026, + "args": { + "External id": 232914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115752000.502, "dur": 1.649, + "args": { + "External id": 232915,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115752001.360, "dur": 0.718, + "args": { + "External id": 232916,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752006.432, "dur": 5.236, + "args": { + "External id": 232917,"Record function id": 0, "Ev Idx": 3028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752007.553, "dur": 3.688, + "args": { + "External id": 232918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115752008.120, "dur": 2.688, + "args": { + "External id": 232919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115752008.669, "dur": 2.037, + "args": { + "External id": 232920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752014.960, "dur": 3.658, + "args": { + "External id": 232921,"Record function id": 0, "Ev Idx": 3032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752015.893, "dur": 2.318, + "args": { + "External id": 232922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115752016.390, "dur": 1.411, + "args": { + "External id": 232923,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115752017.013, "dur": 0.718, + "args": { + "External id": 232924,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752021.769, "dur": 3.647, + "args": { + "External id": 232925,"Record function id": 0, "Ev Idx": 3036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115752022.756, "dur": 2.243, + "args": { + "External id": 232926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115752023.379, "dur": 1.228, + "args": { + "External id": 232927,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115752023.959, "dur": 0.584, + "args": { + "External id": 232928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115752029.112, "dur": 15186.835, + "args": { + "External id": 232929,"Record function id": 0, "Sequence number": 2757765, "Fwd thread id": 1, "Ev Idx": 3040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115752030.606, "dur": 15175.689, + "args": { + "External id": 232930,"Sequence number": 2757765, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3041 + } + }, + { + "ph": "f", "id": 191, "pid": 4183442, "tid": 31331, "ts": 667115752030.606, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115752061.195, "dur": 38.031, + "args": { + "External id": 232931,"Record function id": 0, "Ev Idx": 3042 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115752106.517, "dur": 65.436, + "args": { + "External id": 232932,"Record function id": 0, "Ev Idx": 3043 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.10)", "pid": 4183442, "tid": 31331, + "ts": 667115752178.401, "dur": 15020.659, + "args": { + "External id": 232933,"Record function id": 0, "Ev Idx": 3044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115752258.482, "dur": 6.298, + "args": { + "External id": 232934,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115752273.622, "dur": 4.543, + "args": { + "External id": 232935,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115752291.053, "dur": 14153.904, + "args": { + "External id": 232936,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115752307.571, "dur": 14129.097, + "args": { + "External id": 232937,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115752332.180, "dur": 14.022, + "args": { + "External id": 232938,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115752350.040, "dur": 14049.772, + "args": { + "External id": 232939,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115752352.317, "dur": 14046.686, + "args": { + "External id": 232940,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115752355.964, "dur": 4.862, + "args": { + "External id": 232941,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115752362.441, "dur": 14032.934, + "args": { + "External id": 232942,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115766545.457, "dur": 10.235, + "args": { + "External id": 232943,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115766548.783, "dur": 6.347, + "args": { + "External id": 232944,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115766583.262, "dur": 340.421, + "args": { + "External id": 232945,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115766608.318, "dur": 310.463, + "args": { + "External id": 232946,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3057, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115766619.542, "dur": 294.182, + "args": { + "External id": 232947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115766942.101, "dur": 2.319, + "args": { + "External id": 232948,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3059, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767000.120, "dur": 8.165, + "args": { + "External id": 232949,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767050.774, "dur": 1.467, + "args": { + "External id": 232950,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767067.621, "dur": 1.077, + "args": { + "External id": 232951,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767080.533, "dur": 0.812, + "args": { + "External id": 232952,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767093.247, "dur": 2.498, + "args": { + "External id": 232953,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767105.864, "dur": 0.895, + "args": { + "External id": 232954,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767117.060, "dur": 0.864, + "args": { + "External id": 232955,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767128.520, "dur": 1.527, + "args": { + "External id": 232956,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767139.591, "dur": 2.768, + "args": { + "External id": 232957,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115767229.703, "dur": 2609.978, + "args": { + "External id": 232958,"Record function id": 0, "Ev Idx": 3069 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115767248.622, "dur": 990.020, + "args": { + "External id": 232959,"Record function id": 0, "Ev Idx": 3070 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115767262.985, "dur": 326.062, + "args": { + "External id": 232960,"Record function id": 0, "Ev Idx": 3071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767360.430, "dur": 4.542, + "args": { + "External id": 232961,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767368.405, "dur": 1.059, + "args": { + "External id": 232962,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767371.071, "dur": 1.054, + "args": { + "External id": 232963,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767373.499, "dur": 0.884, + "args": { + "External id": 232964,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767375.618, "dur": 0.787, + "args": { + "External id": 232965,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767377.807, "dur": 1.154, + "args": { + "External id": 232966,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767380.603, "dur": 2.713, + "args": { + "External id": 232967,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767384.862, "dur": 0.707, + "args": { + "External id": 232968,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767387.260, "dur": 0.987, + "args": { + "External id": 232969,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115767389.732, "dur": 0.652, + "args": { + "External id": 232970,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115767406.991, "dur": 152.558, + "args": { + "External id": 232971,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115767421.987, "dur": 132.590, + "args": { + "External id": 232972,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115767435.153, "dur": 11.732, + "args": { + "External id": 232973,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115767450.113, "dur": 78.686, + "args": { + "External id": 232974,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115767452.331, "dur": 76.194, + "args": { + "External id": 232975,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767455.774, "dur": 5.940, + "args": { + "External id": 232976,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115767463.386, "dur": 64.045, + "args": { + "External id": 232977,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3088 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.8", "pid": 4183442, "tid": 31331, + "ts": 667115767709.905, "dur": 521.184, + "args": { + "External id": 232978,"Record function id": 0, "Ev Idx": 3089 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115767726.947, "dur": 492.445, + "args": { + "External id": 232979,"Record function id": 0, "Ev Idx": 3090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115767786.498, "dur": 5.399, + "args": { + "External id": 232980,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115767807.003, "dur": 27.651, + "args": { + "External id": 232981,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767811.527, "dur": 1.731, + "args": { + "External id": 232982,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767815.080, "dur": 2.379, + "args": { + "External id": 232983,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767818.602, "dur": 0.539, + "args": { + "External id": 232984,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767820.532, "dur": 0.237, + "args": { + "External id": 232985,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767821.695, "dur": 0.558, + "args": { + "External id": 232986,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767824.062, "dur": 0.356, + "args": { + "External id": 232987,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767826.260, "dur": 0.695, + "args": { + "External id": 232988,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767828.027, "dur": 0.753, + "args": { + "External id": 232989,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767830.141, "dur": 0.552, + "args": { + "External id": 232990,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115767845.004, "dur": 29.846, + "args": { + "External id": 232991,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115767904.158, "dur": 93.563, + "args": { + "External id": 232992,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115767913.771, "dur": 5.237, + "args": { + "External id": 232993,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115767924.026, "dur": 9.664, + "args": { + "External id": 232994,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115767928.182, "dur": 5.117, + "args": { + "External id": 232995,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767931.595, "dur": 0.595, + "args": { + "External id": 232996,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115767939.856, "dur": 21.272, + "args": { + "External id": 232997,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767941.692, "dur": 0.357, + "args": { + "External id": 232998,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767943.357, "dur": 0.353, + "args": { + "External id": 232999,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767944.970, "dur": 0.283, + "args": { + "External id": 233000,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767946.436, "dur": 0.487, + "args": { + "External id": 233001,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767948.432, "dur": 0.498, + "args": { + "External id": 233002,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767950.586, "dur": 0.344, + "args": { + "External id": 233003,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767952.729, "dur": 1.855, + "args": { + "External id": 233004,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767955.916, "dur": 0.289, + "args": { + "External id": 233005,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115767957.452, "dur": 0.618, + "args": { + "External id": 233006,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115767971.394, "dur": 19.487, + "args": { + "External id": 233007,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115768041.128, "dur": 115.754, + "args": { + "External id": 233008,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115768063.659, "dur": 90.225, + "args": { + "External id": 233009,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3120, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115768073.191, "dur": 76.576, + "args": { + "External id": 233010,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115768170.413, "dur": 1.845, + "args": { + "External id": 233011,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3122, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115768246.064, "dur": 1571.535, + "args": { + "External id": 233012,"Sequence number": 2757764, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3123 + } + }, + { + "ph": "f", "id": 192, "pid": 4183442, "tid": 31331, "ts": 667115768246.064, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768354.184, "dur": 96.271, + "args": { + "External id": 233013,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115768486.253, "dur": 59.844, + "args": { + "External id": 233014,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115768568.979, "dur": 43.246, + "args": { + "External id": 233015,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768622.179, "dur": 25.971, + "args": { + "External id": 233016,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768693.515, "dur": 38.581, + "args": { + "External id": 233017,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768742.361, "dur": 26.122, + "args": { + "External id": 233018,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768775.987, "dur": 29.483, + "args": { + "External id": 233019,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115768829.219, "dur": 21.343, + "args": { + "External id": 233020,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115768867.825, "dur": 25.952, + "args": { + "External id": 233021,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115768910.695, "dur": 17.673, + "args": { + "External id": 233022,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115768939.245, "dur": 12.573, + "args": { + "External id": 233023,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115768960.866, "dur": 36.068, + "args": { + "External id": 233024,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769000.145, "dur": 30.548, + "args": { + "External id": 233025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115769056.844, "dur": 164.553, + "args": { + "External id": 233026,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115769131.489, "dur": 5.558, + "args": { + "External id": 233027,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115769138.989, "dur": 3.735, + "args": { + "External id": 233028,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115769255.304, "dur": 22.433, + "args": { + "External id": 233029,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115769289.665, "dur": 13.783, + "args": { + "External id": 233030,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769310.499, "dur": 44.480, + "args": { + "External id": 233031,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769360.437, "dur": 33.470, + "args": { + "External id": 233032,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769399.522, "dur": 27.138, + "args": { + "External id": 233033,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769432.433, "dur": 28.697, + "args": { + "External id": 233034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769466.003, "dur": 45.463, + "args": { + "External id": 233035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115769521.185, "dur": 32.620, + "args": { + "External id": 233036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115769569.915, "dur": 22.092, + "args": { + "External id": 233037,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115769607.446, "dur": 22.502, + "args": { + "External id": 233038,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115769642.873, "dur": 68.282, + "args": { + "External id": 233039,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115769740.776, "dur": 15.505, + "args": { + "External id": 233040,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115769770.766, "dur": 15.449, + "args": { + "External id": 233041,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769864.881, "dur": 14.719, + "args": { + "External id": 233042,"Record function id": 0, "Ev Idx": 3153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769868.034, "dur": 10.673, + "args": { + "External id": 233043,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769872.094, "dur": 5.612, + "args": { + "External id": 233044,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769873.583, "dur": 4.030, + "args": { + "External id": 233045,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769883.499, "dur": 4.764, + "args": { + "External id": 233046,"Record function id": 0, "Ev Idx": 3157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769884.718, "dur": 3.085, + "args": { + "External id": 233047,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769885.815, "dur": 1.464, + "args": { + "External id": 233048,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769886.334, "dur": 0.862, + "args": { + "External id": 233049,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769891.581, "dur": 4.736, + "args": { + "External id": 233050,"Record function id": 0, "Ev Idx": 3161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769893.026, "dur": 2.864, + "args": { + "External id": 233051,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769894.067, "dur": 1.393, + "args": { + "External id": 233052,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769894.656, "dur": 0.698, + "args": { + "External id": 233053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769899.519, "dur": 8.924, + "args": { + "External id": 233054,"Record function id": 0, "Ev Idx": 3165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769900.844, "dur": 7.171, + "args": { + "External id": 233055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769901.447, "dur": 6.158, + "args": { + "External id": 233056,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769901.739, "dur": 5.785, + "args": { + "External id": 233057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769911.561, "dur": 3.922, + "args": { + "External id": 233058,"Record function id": 0, "Ev Idx": 3169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769912.606, "dur": 2.421, + "args": { + "External id": 233059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769913.152, "dur": 1.500, + "args": { + "External id": 233060,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769913.707, "dur": 0.853, + "args": { + "External id": 233061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769918.704, "dur": 3.996, + "args": { + "External id": 233062,"Record function id": 0, "Ev Idx": 3173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769919.716, "dur": 2.547, + "args": { + "External id": 233063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769920.340, "dur": 1.403, + "args": { + "External id": 233064,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769920.815, "dur": 0.860, + "args": { + "External id": 233065,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769925.958, "dur": 3.582, + "args": { + "External id": 233066,"Record function id": 0, "Ev Idx": 3177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769927.038, "dur": 2.024, + "args": { + "External id": 233067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769927.549, "dur": 1.089, + "args": { + "External id": 233068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769927.866, "dur": 0.698, + "args": { + "External id": 233069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769932.563, "dur": 3.808, + "args": { + "External id": 233070,"Record function id": 0, "Ev Idx": 3181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769933.763, "dur": 2.164, + "args": { + "External id": 233071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769934.618, "dur": 0.920, + "args": { + "External id": 233072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769934.924, "dur": 0.527, + "args": { + "External id": 233073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769939.489, "dur": 3.548, + "args": { + "External id": 233074,"Record function id": 0, "Ev Idx": 3185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115769940.514, "dur": 2.096, + "args": { + "External id": 233075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115769940.993, "dur": 1.074, + "args": { + "External id": 233076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115769941.476, "dur": 0.527, + "args": { + "External id": 233077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115769946.771, "dur": 14977.246, + "args": { + "External id": 233078,"Record function id": 0, "Sequence number": 2757763, "Fwd thread id": 1, "Ev Idx": 3189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115769948.124, "dur": 14966.818, + "args": { + "External id": 233079,"Sequence number": 2757763, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3190 + } + }, + { + "ph": "f", "id": 193, "pid": 4183442, "tid": 31331, "ts": 667115769948.124, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115769982.231, "dur": 39.563, + "args": { + "External id": 233080,"Record function id": 0, "Ev Idx": 3191 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115770028.753, "dur": 65.680, + "args": { + "External id": 233081,"Record function id": 0, "Ev Idx": 3192 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.9)", "pid": 4183442, "tid": 31331, + "ts": 667115770100.209, "dur": 14807.220, + "args": { + "External id": 233082,"Record function id": 0, "Ev Idx": 3193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115770186.404, "dur": 6.625, + "args": { + "External id": 233083,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115770202.138, "dur": 4.461, + "args": { + "External id": 233084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115770219.717, "dur": 14004.604, + "args": { + "External id": 233085,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115770236.575, "dur": 13979.549, + "args": { + "External id": 233086,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115770258.770, "dur": 15.229, + "args": { + "External id": 233087,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115770278.762, "dur": 13905.437, + "args": { + "External id": 233088,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115770281.498, "dur": 13901.948, + "args": { + "External id": 233089,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115770285.246, "dur": 4.202, + "args": { + "External id": 233090,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115770290.953, "dur": 13888.800, + "args": { + "External id": 233091,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115784311.287, "dur": 8.759, + "args": { + "External id": 233092,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115784314.018, "dur": 5.704, + "args": { + "External id": 233093,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115784347.225, "dur": 259.001, + "args": { + "External id": 233094,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115784371.300, "dur": 230.366, + "args": { + "External id": 233095,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3206, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115784381.957, "dur": 214.729, + "args": { + "External id": 233096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115784622.798, "dur": 2.094, + "args": { + "External id": 233097,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3208, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784710.639, "dur": 6.286, + "args": { + "External id": 233098,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784760.451, "dur": 1.414, + "args": { + "External id": 233099,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784776.628, "dur": 1.351, + "args": { + "External id": 233100,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784791.491, "dur": 1.002, + "args": { + "External id": 233101,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784802.911, "dur": 0.995, + "args": { + "External id": 233102,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784813.830, "dur": 0.999, + "args": { + "External id": 233103,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784824.900, "dur": 0.804, + "args": { + "External id": 233104,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784837.849, "dur": 1.655, + "args": { + "External id": 233105,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115784848.604, "dur": 0.916, + "args": { + "External id": 233106,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115784939.679, "dur": 2546.242, + "args": { + "External id": 233107,"Record function id": 0, "Ev Idx": 3218 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115784958.847, "dur": 968.331, + "args": { + "External id": 233108,"Record function id": 0, "Ev Idx": 3219 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115784972.547, "dur": 288.802, + "args": { + "External id": 233109,"Record function id": 0, "Ev Idx": 3220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785052.653, "dur": 4.124, + "args": { + "External id": 233110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785059.785, "dur": 1.168, + "args": { + "External id": 233111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785062.545, "dur": 1.102, + "args": { + "External id": 233112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785065.283, "dur": 2.944, + "args": { + "External id": 233113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785069.858, "dur": 1.111, + "args": { + "External id": 233114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785072.445, "dur": 0.973, + "args": { + "External id": 233115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785075.027, "dur": 1.605, + "args": { + "External id": 233116,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785077.995, "dur": 1.140, + "args": { + "External id": 233117,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785080.505, "dur": 1.083, + "args": { + "External id": 233118,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115785083.078, "dur": 0.669, + "args": { + "External id": 233119,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115785100.622, "dur": 134.694, + "args": { + "External id": 233120,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115785115.592, "dur": 115.772, + "args": { + "External id": 233121,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115785127.736, "dur": 12.193, + "args": { + "External id": 233122,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115785142.253, "dur": 63.838, + "args": { + "External id": 233123,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115785145.037, "dur": 60.749, + "args": { + "External id": 233124,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785148.456, "dur": 6.818, + "args": { + "External id": 233125,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115785156.973, "dur": 48.121, + "args": { + "External id": 233126,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3237 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.7", "pid": 4183442, "tid": 31331, + "ts": 667115785344.324, "dur": 575.342, + "args": { + "External id": 233127,"Record function id": 0, "Ev Idx": 3238 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115785359.354, "dur": 548.684, + "args": { + "External id": 233128,"Record function id": 0, "Ev Idx": 3239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115785415.081, "dur": 4.541, + "args": { + "External id": 233129,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115785433.355, "dur": 23.543, + "args": { + "External id": 233130,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785437.469, "dur": 1.457, + "args": { + "External id": 233131,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785440.502, "dur": 0.549, + "args": { + "External id": 233132,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785442.114, "dur": 0.902, + "args": { + "External id": 233133,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785444.363, "dur": 0.582, + "args": { + "External id": 233134,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785445.887, "dur": 0.307, + "args": { + "External id": 233135,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785447.125, "dur": 0.276, + "args": { + "External id": 233136,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785448.408, "dur": 2.048, + "args": { + "External id": 233137,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785451.578, "dur": 0.398, + "args": { + "External id": 233138,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785452.982, "dur": 0.382, + "args": { + "External id": 233139,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115785466.734, "dur": 49.772, + "args": { + "External id": 233140,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115785550.431, "dur": 95.593, + "args": { + "External id": 233141,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115785560.518, "dur": 4.384, + "args": { + "External id": 233142,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115785569.942, "dur": 9.637, + "args": { + "External id": 233143,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115785573.990, "dur": 5.171, + "args": { + "External id": 233144,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785577.208, "dur": 0.547, + "args": { + "External id": 233145,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115785586.020, "dur": 20.141, + "args": { + "External id": 233146,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785587.539, "dur": 0.537, + "args": { + "External id": 233147,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785589.090, "dur": 0.488, + "args": { + "External id": 233148,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785590.528, "dur": 0.401, + "args": { + "External id": 233149,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785591.792, "dur": 2.534, + "args": { + "External id": 233150,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785595.440, "dur": 0.460, + "args": { + "External id": 233151,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785597.068, "dur": 0.488, + "args": { + "External id": 233152,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785598.569, "dur": 0.544, + "args": { + "External id": 233153,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785600.561, "dur": 0.330, + "args": { + "External id": 233154,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115785602.303, "dur": 0.377, + "args": { + "External id": 233155,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115785616.680, "dur": 22.084, + "args": { + "External id": 233156,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115785731.792, "dur": 109.849, + "args": { + "External id": 233157,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115785754.185, "dur": 84.304, + "args": { + "External id": 233158,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3269, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115785763.509, "dur": 70.761, + "args": { + "External id": 233159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115785856.937, "dur": 1.931, + "args": { + "External id": 233160,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3271, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115785933.859, "dur": 1531.785, + "args": { + "External id": 233161,"Sequence number": 2757762, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3272 + } + }, + { + "ph": "f", "id": 194, "pid": 4183442, "tid": 31331, "ts": 667115785933.859, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786044.424, "dur": 96.758, + "args": { + "External id": 233162,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115786180.819, "dur": 36.301, + "args": { + "External id": 233163,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115786232.921, "dur": 38.599, + "args": { + "External id": 233164,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786280.645, "dur": 25.136, + "args": { + "External id": 233165,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786313.514, "dur": 33.648, + "args": { + "External id": 233166,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786356.524, "dur": 19.762, + "args": { + "External id": 233167,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786382.350, "dur": 28.596, + "args": { + "External id": 233168,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115786432.527, "dur": 20.083, + "args": { + "External id": 233169,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115786469.520, "dur": 46.335, + "args": { + "External id": 233170,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115786538.640, "dur": 20.155, + "args": { + "External id": 233171,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115786571.642, "dur": 14.559, + "args": { + "External id": 233172,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786596.534, "dur": 40.061, + "args": { + "External id": 233173,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786640.026, "dur": 70.403, + "args": { + "External id": 233174,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115786740.334, "dur": 164.338, + "args": { + "External id": 233175,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115786812.221, "dur": 6.011, + "args": { + "External id": 233176,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115786820.061, "dur": 4.589, + "args": { + "External id": 233177,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115786936.416, "dur": 26.871, + "args": { + "External id": 233178,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115786975.578, "dur": 15.118, + "args": { + "External id": 233179,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115786998.461, "dur": 49.606, + "args": { + "External id": 233180,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115787053.946, "dur": 30.952, + "args": { + "External id": 233181,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115787091.211, "dur": 27.924, + "args": { + "External id": 233182,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115787125.861, "dur": 30.559, + "args": { + "External id": 233183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115787162.428, "dur": 27.636, + "args": { + "External id": 233184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115787199.819, "dur": 28.622, + "args": { + "External id": 233185,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115787245.578, "dur": 26.900, + "args": { + "External id": 233186,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115787289.084, "dur": 27.277, + "args": { + "External id": 233187,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115787331.028, "dur": 32.291, + "args": { + "External id": 233188,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115787388.379, "dur": 16.111, + "args": { + "External id": 233189,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115787417.837, "dur": 19.908, + "args": { + "External id": 233190,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787527.874, "dur": 15.876, + "args": { + "External id": 233191,"Record function id": 0, "Ev Idx": 3302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787531.508, "dur": 10.954, + "args": { + "External id": 233192,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787535.535, "dur": 5.573, + "args": { + "External id": 233193,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787536.821, "dur": 4.087, + "args": { + "External id": 233194,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787550.483, "dur": 6.180, + "args": { + "External id": 233195,"Record function id": 0, "Ev Idx": 3306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787552.039, "dur": 4.155, + "args": { + "External id": 233196,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787553.561, "dur": 2.064, + "args": { + "External id": 233197,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787554.128, "dur": 1.424, + "args": { + "External id": 233198,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787560.084, "dur": 4.068, + "args": { + "External id": 233199,"Record function id": 0, "Ev Idx": 3310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787561.241, "dur": 2.440, + "args": { + "External id": 233200,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787561.914, "dur": 1.348, + "args": { + "External id": 233201,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787562.290, "dur": 0.883, + "args": { + "External id": 233202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787567.417, "dur": 4.067, + "args": { + "External id": 233203,"Record function id": 0, "Ev Idx": 3314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787568.974, "dur": 2.106, + "args": { + "External id": 233204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787569.612, "dur": 1.044, + "args": { + "External id": 233205,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787569.883, "dur": 0.694, + "args": { + "External id": 233206,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787574.530, "dur": 6.157, + "args": { + "External id": 233207,"Record function id": 0, "Ev Idx": 3318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787575.896, "dur": 4.301, + "args": { + "External id": 233208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787576.354, "dur": 3.396, + "args": { + "External id": 233209,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787576.955, "dur": 2.733, + "args": { + "External id": 233210,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787583.901, "dur": 5.115, + "args": { + "External id": 233211,"Record function id": 0, "Ev Idx": 3322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787585.556, "dur": 3.009, + "args": { + "External id": 233212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787586.278, "dur": 1.751, + "args": { + "External id": 233213,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787587.050, "dur": 0.918, + "args": { + "External id": 233214,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787592.402, "dur": 4.036, + "args": { + "External id": 233215,"Record function id": 0, "Ev Idx": 3326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787593.641, "dur": 2.381, + "args": { + "External id": 233216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787594.138, "dur": 1.477, + "args": { + "External id": 233217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787594.898, "dur": 0.652, + "args": { + "External id": 233218,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787599.675, "dur": 4.220, + "args": { + "External id": 233219,"Record function id": 0, "Ev Idx": 3330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787600.699, "dur": 2.780, + "args": { + "External id": 233220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787601.151, "dur": 1.910, + "args": { + "External id": 233221,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787602.254, "dur": 0.747, + "args": { + "External id": 233222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787609.802, "dur": 3.830, + "args": { + "External id": 233223,"Record function id": 0, "Ev Idx": 3334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115787610.763, "dur": 2.430, + "args": { + "External id": 233224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115787611.230, "dur": 1.561, + "args": { + "External id": 233225,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115787612.113, "dur": 0.612, + "args": { + "External id": 233226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115787617.254, "dur": 16540.891, + "args": { + "External id": 233227,"Record function id": 0, "Sequence number": 2757761, "Fwd thread id": 1, "Ev Idx": 3338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115787618.783, "dur": 16531.084, + "args": { + "External id": 233228,"Sequence number": 2757761, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3339 + } + }, + { + "ph": "f", "id": 195, "pid": 4183442, "tid": 31331, "ts": 667115787618.783, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115787649.231, "dur": 78.266, + "args": { + "External id": 233229,"Record function id": 0, "Ev Idx": 3340 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115787736.011, "dur": 64.255, + "args": { + "External id": 233230,"Record function id": 0, "Ev Idx": 3341 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.8)", "pid": 4183442, "tid": 31331, + "ts": 667115787805.963, "dur": 16336.226, + "args": { + "External id": 233231,"Record function id": 0, "Ev Idx": 3342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115787891.668, "dur": 7.128, + "args": { + "External id": 233232,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115787908.151, "dur": 4.984, + "args": { + "External id": 233233,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115787929.530, "dur": 15465.952, + "args": { + "External id": 233234,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115787942.628, "dur": 15445.259, + "args": { + "External id": 233235,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115787966.507, "dur": 17.118, + "args": { + "External id": 233236,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115787987.352, "dur": 15361.996, + "args": { + "External id": 233237,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115787989.585, "dur": 15358.995, + "args": { + "External id": 233238,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115787994.057, "dur": 6.292, + "args": { + "External id": 233239,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115788001.927, "dur": 15343.304, + "args": { + "External id": 233240,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115803481.202, "dur": 9.039, + "args": { + "External id": 233241,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115803484.092, "dur": 5.799, + "args": { + "External id": 233242,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115803530.025, "dur": 331.218, + "args": { + "External id": 233243,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115803556.917, "dur": 299.390, + "args": { + "External id": 233244,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3355, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115803567.823, "dur": 283.504, + "args": { + "External id": 233245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115803881.049, "dur": 2.206, + "args": { + "External id": 233246,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3357, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115803941.739, "dur": 6.267, + "args": { + "External id": 233247,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115803990.014, "dur": 1.520, + "args": { + "External id": 233248,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804006.950, "dur": 1.667, + "args": { + "External id": 233249,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804020.062, "dur": 2.802, + "args": { + "External id": 233250,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804033.524, "dur": 1.010, + "args": { + "External id": 233251,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804044.769, "dur": 0.846, + "args": { + "External id": 233252,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804056.548, "dur": 0.886, + "args": { + "External id": 233253,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804068.386, "dur": 3.202, + "args": { + "External id": 233254,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804081.527, "dur": 0.815, + "args": { + "External id": 233255,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115804171.708, "dur": 2608.147, + "args": { + "External id": 233256,"Record function id": 0, "Ev Idx": 3367 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115804191.717, "dur": 990.911, + "args": { + "External id": 233257,"Record function id": 0, "Ev Idx": 3368 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115804206.227, "dur": 312.383, + "args": { + "External id": 233258,"Record function id": 0, "Ev Idx": 3369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804284.427, "dur": 4.148, + "args": { + "External id": 233259,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804291.657, "dur": 1.256, + "args": { + "External id": 233260,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804294.639, "dur": 1.212, + "args": { + "External id": 233261,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804297.546, "dur": 1.030, + "args": { + "External id": 233262,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804300.242, "dur": 2.944, + "args": { + "External id": 233263,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804305.142, "dur": 1.067, + "args": { + "External id": 233264,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804308.212, "dur": 1.634, + "args": { + "External id": 233265,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804311.822, "dur": 1.093, + "args": { + "External id": 233266,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804314.931, "dur": 1.197, + "args": { + "External id": 233267,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115804318.074, "dur": 1.074, + "args": { + "External id": 233268,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115804336.094, "dur": 135.209, + "args": { + "External id": 233269,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115804351.967, "dur": 115.265, + "args": { + "External id": 233270,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115804364.190, "dur": 14.293, + "args": { + "External id": 233271,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115804380.906, "dur": 59.322, + "args": { + "External id": 233272,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115804383.933, "dur": 56.004, + "args": { + "External id": 233273,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804387.832, "dur": 5.350, + "args": { + "External id": 233274,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115804394.845, "dur": 44.541, + "args": { + "External id": 233275,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3386 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.6", "pid": 4183442, "tid": 31331, + "ts": 667115804607.714, "dur": 566.211, + "args": { + "External id": 233276,"Record function id": 0, "Ev Idx": 3387 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115804625.680, "dur": 535.825, + "args": { + "External id": 233277,"Record function id": 0, "Ev Idx": 3388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115804723.543, "dur": 8.095, + "args": { + "External id": 233278,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115804747.408, "dur": 29.073, + "args": { + "External id": 233279,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804752.291, "dur": 1.667, + "args": { + "External id": 233280,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804755.701, "dur": 0.773, + "args": { + "External id": 233281,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804758.335, "dur": 0.564, + "args": { + "External id": 233282,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804760.762, "dur": 0.304, + "args": { + "External id": 233283,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804762.275, "dur": 0.247, + "args": { + "External id": 233284,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804763.934, "dur": 0.600, + "args": { + "External id": 233285,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804766.151, "dur": 0.913, + "args": { + "External id": 233286,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804768.531, "dur": 1.746, + "args": { + "External id": 233287,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804771.550, "dur": 0.640, + "args": { + "External id": 233288,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115804787.059, "dur": 33.117, + "args": { + "External id": 233289,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115804852.381, "dur": 93.289, + "args": { + "External id": 233290,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115804862.034, "dur": 3.310, + "args": { + "External id": 233291,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115804870.376, "dur": 9.164, + "args": { + "External id": 233292,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115804874.334, "dur": 4.800, + "args": { + "External id": 233293,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804877.553, "dur": 0.468, + "args": { + "External id": 233294,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115804886.213, "dur": 23.435, + "args": { + "External id": 233295,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804888.197, "dur": 0.826, + "args": { + "External id": 233296,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804890.836, "dur": 0.492, + "args": { + "External id": 233297,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804893.213, "dur": 0.608, + "args": { + "External id": 233298,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804894.851, "dur": 0.540, + "args": { + "External id": 233299,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804896.937, "dur": 2.298, + "args": { + "External id": 233300,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804900.430, "dur": 0.526, + "args": { + "External id": 233301,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804902.462, "dur": 0.373, + "args": { + "External id": 233302,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804904.148, "dur": 0.405, + "args": { + "External id": 233303,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115804906.714, "dur": 0.347, + "args": { + "External id": 233304,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115804918.993, "dur": 19.246, + "args": { + "External id": 233305,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115804989.804, "dur": 108.642, + "args": { + "External id": 233306,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115805012.751, "dur": 82.395, + "args": { + "External id": 233307,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3418, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115805022.169, "dur": 68.989, + "args": { + "External id": 233308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115805112.592, "dur": 1.874, + "args": { + "External id": 233309,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3420, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115805190.945, "dur": 1562.968, + "args": { + "External id": 233310,"Sequence number": 2757760, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3421 + } + }, + { + "ph": "f", "id": 196, "pid": 4183442, "tid": 31331, "ts": 667115805190.945, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805298.664, "dur": 97.341, + "args": { + "External id": 233311,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115805435.807, "dur": 36.506, + "args": { + "External id": 233312,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115805488.741, "dur": 67.202, + "args": { + "External id": 233313,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805568.162, "dur": 37.479, + "args": { + "External id": 233314,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805611.698, "dur": 34.527, + "args": { + "External id": 233315,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805690.942, "dur": 26.355, + "args": { + "External id": 233316,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805725.445, "dur": 29.657, + "args": { + "External id": 233317,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115805782.323, "dur": 23.448, + "args": { + "External id": 233318,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115805824.294, "dur": 26.170, + "args": { + "External id": 233319,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115805868.846, "dur": 17.965, + "args": { + "External id": 233320,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115805899.459, "dur": 13.827, + "args": { + "External id": 233321,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805923.817, "dur": 36.019, + "args": { + "External id": 233322,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115805963.088, "dur": 30.289, + "args": { + "External id": 233323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115806022.041, "dur": 162.225, + "args": { + "External id": 233324,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115806096.074, "dur": 6.033, + "args": { + "External id": 233325,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115806103.952, "dur": 2.748, + "args": { + "External id": 233326,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115806214.575, "dur": 23.774, + "args": { + "External id": 233327,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115806249.336, "dur": 12.863, + "args": { + "External id": 233328,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806269.490, "dur": 40.033, + "args": { + "External id": 233329,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806316.483, "dur": 31.156, + "args": { + "External id": 233330,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806353.163, "dur": 27.260, + "args": { + "External id": 233331,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806384.482, "dur": 27.985, + "args": { + "External id": 233332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806417.671, "dur": 26.175, + "args": { + "External id": 233333,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115806452.236, "dur": 27.569, + "args": { + "External id": 233334,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115806511.502, "dur": 24.022, + "args": { + "External id": 233335,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115806553.506, "dur": 22.444, + "args": { + "External id": 233336,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115806589.110, "dur": 15.722, + "args": { + "External id": 233337,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115806618.592, "dur": 13.435, + "args": { + "External id": 233338,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115806696.302, "dur": 26.584, + "args": { + "External id": 233339,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806801.101, "dur": 14.803, + "args": { + "External id": 233340,"Record function id": 0, "Ev Idx": 3451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806804.267, "dur": 10.744, + "args": { + "External id": 233341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806808.767, "dur": 5.471, + "args": { + "External id": 233342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806810.132, "dur": 3.991, + "args": { + "External id": 233343,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806819.763, "dur": 5.284, + "args": { + "External id": 233344,"Record function id": 0, "Ev Idx": 3455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806821.074, "dur": 3.502, + "args": { + "External id": 233345,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806822.379, "dur": 1.608, + "args": { + "External id": 233346,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806823.068, "dur": 0.849, + "args": { + "External id": 233347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806828.656, "dur": 9.749, + "args": { + "External id": 233348,"Record function id": 0, "Ev Idx": 3459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806830.021, "dur": 7.904, + "args": { + "External id": 233349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806831.352, "dur": 6.074, + "args": { + "External id": 233350,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806835.233, "dur": 2.080, + "args": { + "External id": 233351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806841.845, "dur": 4.238, + "args": { + "External id": 233352,"Record function id": 0, "Ev Idx": 3463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806843.097, "dur": 2.536, + "args": { + "External id": 233353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806843.985, "dur": 1.219, + "args": { + "External id": 233354,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806844.254, "dur": 0.838, + "args": { + "External id": 233355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806849.192, "dur": 4.159, + "args": { + "External id": 233356,"Record function id": 0, "Ev Idx": 3467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806850.381, "dur": 2.537, + "args": { + "External id": 233357,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806851.323, "dur": 1.166, + "args": { + "External id": 233358,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806851.710, "dur": 0.712, + "args": { + "External id": 233359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806856.416, "dur": 3.908, + "args": { + "External id": 233360,"Record function id": 0, "Ev Idx": 3471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806857.734, "dur": 2.131, + "args": { + "External id": 233361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806858.342, "dur": 1.116, + "args": { + "External id": 233362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806858.861, "dur": 0.532, + "args": { + "External id": 233363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806863.524, "dur": 3.825, + "args": { + "External id": 233364,"Record function id": 0, "Ev Idx": 3475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806864.596, "dur": 2.311, + "args": { + "External id": 233365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806865.125, "dur": 1.234, + "args": { + "External id": 233366,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806865.628, "dur": 0.627, + "args": { + "External id": 233367,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806870.373, "dur": 3.758, + "args": { + "External id": 233368,"Record function id": 0, "Ev Idx": 3479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806871.526, "dur": 2.199, + "args": { + "External id": 233369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806872.424, "dur": 0.892, + "args": { + "External id": 233370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806872.722, "dur": 0.531, + "args": { + "External id": 233371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806877.168, "dur": 3.725, + "args": { + "External id": 233372,"Record function id": 0, "Ev Idx": 3483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115806878.509, "dur": 1.964, + "args": { + "External id": 233373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115806879.146, "dur": 0.905, + "args": { + "External id": 233374,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115806879.433, "dur": 0.545, + "args": { + "External id": 233375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115806884.916, "dur": 15095.755, + "args": { + "External id": 233376,"Record function id": 0, "Sequence number": 2757759, "Fwd thread id": 1, "Ev Idx": 3487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115806886.126, "dur": 15086.290, + "args": { + "External id": 233377,"Sequence number": 2757759, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3488 + } + }, + { + "ph": "f", "id": 197, "pid": 4183442, "tid": 31331, "ts": 667115806886.126, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115806917.593, "dur": 37.156, + "args": { + "External id": 233378,"Record function id": 0, "Ev Idx": 3489 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115806961.709, "dur": 70.166, + "args": { + "External id": 233379,"Record function id": 0, "Ev Idx": 3490 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.7)", "pid": 4183442, "tid": 31331, + "ts": 667115807037.695, "dur": 14927.769, + "args": { + "External id": 233380,"Record function id": 0, "Ev Idx": 3491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115807120.407, "dur": 10.578, + "args": { + "External id": 233381,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115807140.315, "dur": 5.982, + "args": { + "External id": 233382,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115807159.577, "dur": 14128.372, + "args": { + "External id": 233383,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115807173.578, "dur": 14106.706, + "args": { + "External id": 233384,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115807198.081, "dur": 12.989, + "args": { + "External id": 233385,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115807215.178, "dur": 14032.508, + "args": { + "External id": 233386,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115807217.395, "dur": 14029.493, + "args": { + "External id": 233387,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115807220.896, "dur": 4.502, + "args": { + "External id": 233388,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115807227.169, "dur": 14016.284, + "args": { + "External id": 233389,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115821370.608, "dur": 9.164, + "args": { + "External id": 233390,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115821373.653, "dur": 5.838, + "args": { + "External id": 233391,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115821405.418, "dur": 293.100, + "args": { + "External id": 233392,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115821430.026, "dur": 263.720, + "args": { + "External id": 233393,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3504, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115821440.872, "dur": 247.131, + "args": { + "External id": 233394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115821716.582, "dur": 2.630, + "args": { + "External id": 233395,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3506, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821771.166, "dur": 6.224, + "args": { + "External id": 233396,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821822.036, "dur": 1.332, + "args": { + "External id": 233397,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821838.135, "dur": 1.346, + "args": { + "External id": 233398,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821850.606, "dur": 1.897, + "args": { + "External id": 233399,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821862.724, "dur": 0.769, + "args": { + "External id": 233400,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821873.472, "dur": 0.845, + "args": { + "External id": 233401,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821884.765, "dur": 0.995, + "args": { + "External id": 233402,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821896.298, "dur": 3.284, + "args": { + "External id": 233403,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115821909.028, "dur": 1.105, + "args": { + "External id": 233404,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115821995.027, "dur": 2564.051, + "args": { + "External id": 233405,"Record function id": 0, "Ev Idx": 3516 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115822014.031, "dur": 955.367, + "args": { + "External id": 233406,"Record function id": 0, "Ev Idx": 3517 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115822027.527, "dur": 280.576, + "args": { + "External id": 233407,"Record function id": 0, "Ev Idx": 3518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822104.094, "dur": 4.417, + "args": { + "External id": 233408,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822111.837, "dur": 1.175, + "args": { + "External id": 233409,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822115.327, "dur": 1.094, + "args": { + "External id": 233410,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822118.132, "dur": 1.114, + "args": { + "External id": 233411,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822121.117, "dur": 2.102, + "args": { + "External id": 233412,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822124.795, "dur": 0.717, + "args": { + "External id": 233413,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822127.570, "dur": 1.443, + "args": { + "External id": 233414,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822130.765, "dur": 1.040, + "args": { + "External id": 233415,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822133.405, "dur": 0.942, + "args": { + "External id": 233416,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115822136.055, "dur": 0.931, + "args": { + "External id": 233417,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115822153.895, "dur": 130.054, + "args": { + "External id": 233418,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115822168.157, "dur": 111.912, + "args": { + "External id": 233419,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115822180.128, "dur": 12.953, + "args": { + "External id": 233420,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115822195.662, "dur": 60.347, + "args": { + "External id": 233421,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115822198.245, "dur": 57.420, + "args": { + "External id": 233422,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822201.848, "dur": 5.410, + "args": { + "External id": 233423,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115822209.063, "dur": 46.003, + "args": { + "External id": 233424,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3535 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.5", "pid": 4183442, "tid": 31331, + "ts": 667115822384.880, "dur": 577.230, + "args": { + "External id": 233425,"Record function id": 0, "Ev Idx": 3536 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115822400.142, "dur": 550.521, + "args": { + "External id": 233426,"Record function id": 0, "Ev Idx": 3537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115822456.526, "dur": 5.817, + "args": { + "External id": 233427,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115822476.750, "dur": 45.757, + "args": { + "External id": 233428,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822480.996, "dur": 1.163, + "args": { + "External id": 233429,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822483.941, "dur": 0.301, + "args": { + "External id": 233430,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822485.630, "dur": 0.452, + "args": { + "External id": 233431,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822487.701, "dur": 0.312, + "args": { + "External id": 233432,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822489.181, "dur": 0.740, + "args": { + "External id": 233433,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822510.217, "dur": 0.758, + "args": { + "External id": 233434,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822513.230, "dur": 0.568, + "args": { + "External id": 233435,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822515.527, "dur": 1.839, + "args": { + "External id": 233436,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822518.325, "dur": 0.938, + "args": { + "External id": 233437,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115822533.446, "dur": 33.482, + "args": { + "External id": 233438,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115822597.477, "dur": 140.327, + "args": { + "External id": 233439,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115822607.690, "dur": 3.971, + "args": { + "External id": 233440,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115822618.125, "dur": 9.617, + "args": { + "External id": 233441,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115822622.282, "dur": 5.060, + "args": { + "External id": 233442,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822625.673, "dur": 0.559, + "args": { + "External id": 233443,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115822636.872, "dur": 58.534, + "args": { + "External id": 233444,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822638.717, "dur": 0.352, + "args": { + "External id": 233445,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822640.554, "dur": 0.573, + "args": { + "External id": 233446,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822642.343, "dur": 0.525, + "args": { + "External id": 233447,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822644.107, "dur": 0.412, + "args": { + "External id": 233448,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822645.736, "dur": 1.893, + "args": { + "External id": 233449,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822648.600, "dur": 0.799, + "args": { + "External id": 233450,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822650.502, "dur": 34.944, + "args": { + "External id": 233451,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822688.278, "dur": 0.595, + "args": { + "External id": 233452,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115822689.979, "dur": 0.643, + "args": { + "External id": 233453,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115822706.659, "dur": 23.457, + "args": { + "External id": 233454,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115822784.363, "dur": 104.517, + "args": { + "External id": 233455,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115822806.382, "dur": 79.190, + "args": { + "External id": 233456,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3567, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115822815.339, "dur": 66.464, + "args": { + "External id": 233457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115822901.363, "dur": 1.902, + "args": { + "External id": 233458,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3569, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115822977.163, "dur": 1557.928, + "args": { + "External id": 233459,"Sequence number": 2757758, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3570 + } + }, + { + "ph": "f", "id": 198, "pid": 4183442, "tid": 31331, "ts": 667115822977.163, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823087.473, "dur": 96.275, + "args": { + "External id": 233460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115823221.065, "dur": 37.391, + "args": { + "External id": 233461,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115823273.799, "dur": 40.024, + "args": { + "External id": 233462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823322.904, "dur": 26.795, + "args": { + "External id": 233463,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823355.009, "dur": 32.521, + "args": { + "External id": 233464,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823394.178, "dur": 21.503, + "args": { + "External id": 233465,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823422.635, "dur": 28.903, + "args": { + "External id": 233466,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115823472.933, "dur": 44.550, + "args": { + "External id": 233467,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115823537.429, "dur": 29.249, + "args": { + "External id": 233468,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115823586.127, "dur": 20.383, + "args": { + "External id": 233469,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115823618.435, "dur": 14.627, + "args": { + "External id": 233470,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823643.052, "dur": 83.688, + "args": { + "External id": 233471,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115823732.686, "dur": 33.163, + "args": { + "External id": 233472,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115823812.847, "dur": 167.313, + "args": { + "External id": 233473,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115823887.430, "dur": 6.145, + "args": { + "External id": 233474,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115823895.233, "dur": 2.586, + "args": { + "External id": 233475,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115824012.725, "dur": 25.652, + "args": { + "External id": 233476,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115824049.387, "dur": 14.576, + "args": { + "External id": 233477,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824072.965, "dur": 44.595, + "args": { + "External id": 233478,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824124.346, "dur": 31.059, + "args": { + "External id": 233479,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824161.316, "dur": 28.107, + "args": { + "External id": 233480,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824194.064, "dur": 28.433, + "args": { + "External id": 233481,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824227.691, "dur": 27.089, + "args": { + "External id": 233482,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115824262.487, "dur": 28.620, + "args": { + "External id": 233483,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115824307.135, "dur": 21.366, + "args": { + "External id": 233484,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115824349.463, "dur": 24.400, + "args": { + "External id": 233485,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115824387.804, "dur": 16.423, + "args": { + "External id": 233486,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115824420.121, "dur": 14.977, + "args": { + "External id": 233487,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115824445.816, "dur": 32.300, + "args": { + "External id": 233488,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824582.580, "dur": 17.320, + "args": { + "External id": 233489,"Record function id": 0, "Ev Idx": 3600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824585.894, "dur": 13.198, + "args": { + "External id": 233490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824589.941, "dur": 8.359, + "args": { + "External id": 233491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824594.246, "dur": 3.963, + "args": { + "External id": 233492,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824603.568, "dur": 5.082, + "args": { + "External id": 233493,"Record function id": 0, "Ev Idx": 3604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824605.133, "dur": 3.062, + "args": { + "External id": 233494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824606.119, "dur": 1.614, + "args": { + "External id": 233495,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824606.684, "dur": 0.946, + "args": { + "External id": 233496,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824611.992, "dur": 5.167, + "args": { + "External id": 233497,"Record function id": 0, "Ev Idx": 3608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824613.657, "dur": 3.033, + "args": { + "External id": 233498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824614.966, "dur": 1.318, + "args": { + "External id": 233499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824615.406, "dur": 0.764, + "args": { + "External id": 233500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824620.269, "dur": 6.620, + "args": { + "External id": 233501,"Record function id": 0, "Ev Idx": 3612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824621.677, "dur": 4.767, + "args": { + "External id": 233502,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824622.475, "dur": 3.400, + "args": { + "External id": 233503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824622.789, "dur": 2.984, + "args": { + "External id": 233504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824629.986, "dur": 4.267, + "args": { + "External id": 233505,"Record function id": 0, "Ev Idx": 3616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824631.450, "dur": 2.339, + "args": { + "External id": 233506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824632.172, "dur": 1.214, + "args": { + "External id": 233507,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824632.536, "dur": 0.785, + "args": { + "External id": 233508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824637.255, "dur": 4.734, + "args": { + "External id": 233509,"Record function id": 0, "Ev Idx": 3620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824638.739, "dur": 2.814, + "args": { + "External id": 233510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824639.463, "dur": 1.673, + "args": { + "External id": 233511,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824640.169, "dur": 0.900, + "args": { + "External id": 233512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824645.134, "dur": 40.695, + "args": { + "External id": 233513,"Record function id": 0, "Ev Idx": 3624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824646.610, "dur": 2.410, + "args": { + "External id": 233514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824647.324, "dur": 1.265, + "args": { + "External id": 233515,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824647.840, "dur": 0.682, + "args": { + "External id": 233516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824692.012, "dur": 6.174, + "args": { + "External id": 233517,"Record function id": 0, "Ev Idx": 3628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824694.068, "dur": 3.671, + "args": { + "External id": 233518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824695.246, "dur": 1.554, + "args": { + "External id": 233519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824695.697, "dur": 1.029, + "args": { + "External id": 233520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824701.253, "dur": 4.030, + "args": { + "External id": 233521,"Record function id": 0, "Ev Idx": 3632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115824702.670, "dur": 2.160, + "args": { + "External id": 233522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115824703.241, "dur": 1.198, + "args": { + "External id": 233523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115824703.754, "dur": 0.612, + "args": { + "External id": 233524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115824709.261, "dur": 14895.216, + "args": { + "External id": 233525,"Record function id": 0, "Sequence number": 2757757, "Fwd thread id": 1, "Ev Idx": 3636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115824710.743, "dur": 14884.664, + "args": { + "External id": 233526,"Sequence number": 2757757, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3637 + } + }, + { + "ph": "f", "id": 199, "pid": 4183442, "tid": 31331, "ts": 667115824710.743, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115824742.414, "dur": 42.357, + "args": { + "External id": 233527,"Record function id": 0, "Ev Idx": 3638 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115824792.056, "dur": 69.727, + "args": { + "External id": 233528,"Record function id": 0, "Ev Idx": 3639 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.6)", "pid": 4183442, "tid": 31331, + "ts": 667115824867.729, "dur": 14720.391, + "args": { + "External id": 233529,"Record function id": 0, "Ev Idx": 3640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115824956.014, "dur": 6.846, + "args": { + "External id": 233530,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115824972.542, "dur": 8.405, + "args": { + "External id": 233531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115824994.682, "dur": 13936.693, + "args": { + "External id": 233532,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115825007.832, "dur": 13915.750, + "args": { + "External id": 233533,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115825031.796, "dur": 15.427, + "args": { + "External id": 233534,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115825051.197, "dur": 13837.867, + "args": { + "External id": 233535,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115825053.741, "dur": 13834.569, + "args": { + "External id": 233536,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115825057.460, "dur": 4.946, + "args": { + "External id": 233537,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115825064.057, "dur": 13820.946, + "args": { + "External id": 233538,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115839018.404, "dur": 9.089, + "args": { + "External id": 233539,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115839021.173, "dur": 5.991, + "args": { + "External id": 233540,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115839055.782, "dur": 241.594, + "args": { + "External id": 233541,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115839080.469, "dur": 212.606, + "args": { + "External id": 233542,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3653, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115839090.901, "dur": 197.895, + "args": { + "External id": 233543,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115839311.751, "dur": 2.152, + "args": { + "External id": 233544,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3655, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839361.788, "dur": 5.743, + "args": { + "External id": 233545,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839411.108, "dur": 1.256, + "args": { + "External id": 233546,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839428.256, "dur": 1.610, + "args": { + "External id": 233547,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839442.100, "dur": 3.141, + "args": { + "External id": 233548,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839455.353, "dur": 0.911, + "args": { + "External id": 233549,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839466.444, "dur": 0.855, + "args": { + "External id": 233550,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839478.572, "dur": 0.936, + "args": { + "External id": 233551,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839509.264, "dur": 3.564, + "args": { + "External id": 233552,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839527.628, "dur": 0.951, + "args": { + "External id": 233553,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115839619.809, "dur": 2558.871, + "args": { + "External id": 233554,"Record function id": 0, "Ev Idx": 3665 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115839640.002, "dur": 971.835, + "args": { + "External id": 233555,"Record function id": 0, "Ev Idx": 3666 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115839691.367, "dur": 301.316, + "args": { + "External id": 233556,"Record function id": 0, "Ev Idx": 3667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839780.253, "dur": 4.556, + "args": { + "External id": 233557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839788.319, "dur": 1.167, + "args": { + "External id": 233558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839791.319, "dur": 0.886, + "args": { + "External id": 233559,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839793.810, "dur": 0.972, + "args": { + "External id": 233560,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839796.315, "dur": 2.295, + "args": { + "External id": 233561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839800.048, "dur": 1.249, + "args": { + "External id": 233562,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839802.982, "dur": 1.166, + "args": { + "External id": 233563,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839805.804, "dur": 1.386, + "args": { + "External id": 233564,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839808.688, "dur": 0.973, + "args": { + "External id": 233565,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115839811.029, "dur": 1.148, + "args": { + "External id": 233566,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115839829.803, "dur": 135.380, + "args": { + "External id": 233567,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115839845.321, "dur": 115.572, + "args": { + "External id": 233568,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115839856.800, "dur": 13.005, + "args": { + "External id": 233569,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115839872.357, "dur": 60.663, + "args": { + "External id": 233570,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115839874.601, "dur": 58.159, + "args": { + "External id": 233571,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115839878.047, "dur": 5.494, + "args": { + "External id": 233572,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115839885.238, "dur": 46.896, + "args": { + "External id": 233573,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3684 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.4", "pid": 4183442, "tid": 31331, + "ts": 667115840078.715, "dur": 526.322, + "args": { + "External id": 233574,"Record function id": 0, "Ev Idx": 3685 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115840095.272, "dur": 497.636, + "args": { + "External id": 233575,"Record function id": 0, "Ev Idx": 3686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115840152.490, "dur": 6.118, + "args": { + "External id": 233576,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115840173.741, "dur": 24.267, + "args": { + "External id": 233577,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840178.265, "dur": 1.361, + "args": { + "External id": 233578,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840181.539, "dur": 0.653, + "args": { + "External id": 233579,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840183.184, "dur": 0.861, + "args": { + "External id": 233580,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840185.440, "dur": 0.573, + "args": { + "External id": 233581,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840187.044, "dur": 0.346, + "args": { + "External id": 233582,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840188.377, "dur": 0.352, + "args": { + "External id": 233583,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840189.893, "dur": 0.357, + "args": { + "External id": 233584,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840191.541, "dur": 1.963, + "args": { + "External id": 233585,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840194.370, "dur": 0.374, + "args": { + "External id": 233586,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115840207.064, "dur": 30.504, + "args": { + "External id": 233587,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115840265.206, "dur": 91.199, + "args": { + "External id": 233588,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115840274.173, "dur": 3.053, + "args": { + "External id": 233589,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115840281.664, "dur": 9.919, + "args": { + "External id": 233590,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115840285.628, "dur": 5.559, + "args": { + "External id": 233591,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840288.975, "dur": 0.630, + "args": { + "External id": 233592,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115840297.397, "dur": 23.332, + "args": { + "External id": 233593,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840298.763, "dur": 0.594, + "args": { + "External id": 233594,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840300.807, "dur": 0.873, + "args": { + "External id": 233595,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840303.054, "dur": 0.421, + "args": { + "External id": 233596,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840304.590, "dur": 0.689, + "args": { + "External id": 233597,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840306.374, "dur": 1.317, + "args": { + "External id": 233598,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840308.900, "dur": 0.519, + "args": { + "External id": 233599,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840310.543, "dur": 0.377, + "args": { + "External id": 233600,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840311.929, "dur": 0.810, + "args": { + "External id": 233601,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115840314.008, "dur": 0.456, + "args": { + "External id": 233602,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115840329.470, "dur": 19.770, + "args": { + "External id": 233603,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115840398.463, "dur": 126.817, + "args": { + "External id": 233604,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115840420.459, "dur": 100.992, + "args": { + "External id": 233605,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3716, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115840429.100, "dur": 87.348, + "args": { + "External id": 233606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115840541.032, "dur": 2.165, + "args": { + "External id": 233607,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3718, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115840618.803, "dur": 1538.663, + "args": { + "External id": 233608,"Sequence number": 2757756, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3719 + } + }, + { + "ph": "f", "id": 200, "pid": 4183442, "tid": 31331, "ts": 667115840618.803, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115840768.949, "dur": 102.531, + "args": { + "External id": 233609,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115840911.223, "dur": 37.605, + "args": { + "External id": 233610,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115840965.336, "dur": 39.318, + "args": { + "External id": 233611,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841014.132, "dur": 26.255, + "args": { + "External id": 233612,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841045.987, "dur": 32.861, + "args": { + "External id": 233613,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841086.538, "dur": 20.428, + "args": { + "External id": 233614,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841113.649, "dur": 28.342, + "args": { + "External id": 233615,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115841163.863, "dur": 21.208, + "args": { + "External id": 233616,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115841202.921, "dur": 26.638, + "args": { + "External id": 233617,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115841247.988, "dur": 19.360, + "args": { + "External id": 233618,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115841279.600, "dur": 14.165, + "args": { + "External id": 233619,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841302.115, "dur": 34.846, + "args": { + "External id": 233620,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841340.515, "dur": 30.028, + "args": { + "External id": 233621,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115841395.117, "dur": 176.414, + "args": { + "External id": 233622,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115841464.851, "dur": 5.963, + "args": { + "External id": 233623,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115841472.804, "dur": 2.814, + "args": { + "External id": 233624,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115841605.697, "dur": 24.106, + "args": { + "External id": 233625,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115841643.029, "dur": 49.210, + "args": { + "External id": 233626,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841704.342, "dur": 50.376, + "args": { + "External id": 233627,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841763.003, "dur": 32.085, + "args": { + "External id": 233628,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841801.435, "dur": 27.719, + "args": { + "External id": 233629,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841833.467, "dur": 27.903, + "args": { + "External id": 233630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841866.605, "dur": 27.066, + "args": { + "External id": 233631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115841901.858, "dur": 27.526, + "args": { + "External id": 233632,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115841947.183, "dur": 38.424, + "args": { + "External id": 233633,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115842010.644, "dur": 25.101, + "args": { + "External id": 233634,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115842049.946, "dur": 15.737, + "args": { + "External id": 233635,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115842081.189, "dur": 17.072, + "args": { + "External id": 233636,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115842111.075, "dur": 15.758, + "args": { + "External id": 233637,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842199.934, "dur": 18.991, + "args": { + "External id": 233638,"Record function id": 0, "Ev Idx": 3749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842202.865, "dur": 15.231, + "args": { + "External id": 233639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842210.397, "dur": 6.565, + "args": { + "External id": 233640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842211.958, "dur": 4.891, + "args": { + "External id": 233641,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842222.636, "dur": 5.317, + "args": { + "External id": 233642,"Record function id": 0, "Ev Idx": 3753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842224.519, "dur": 2.998, + "args": { + "External id": 233643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842225.295, "dur": 1.554, + "args": { + "External id": 233644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842225.788, "dur": 0.982, + "args": { + "External id": 233645,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842231.060, "dur": 3.855, + "args": { + "External id": 233646,"Record function id": 0, "Ev Idx": 3757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842232.163, "dur": 2.328, + "args": { + "External id": 233647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842232.862, "dur": 1.236, + "args": { + "External id": 233648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842233.276, "dur": 0.718, + "args": { + "External id": 233649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842238.008, "dur": 6.036, + "args": { + "External id": 233650,"Record function id": 0, "Ev Idx": 3761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842239.183, "dur": 4.446, + "args": { + "External id": 233651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842239.860, "dur": 3.340, + "args": { + "External id": 233652,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842240.168, "dur": 2.941, + "args": { + "External id": 233653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842247.055, "dur": 4.293, + "args": { + "External id": 233654,"Record function id": 0, "Ev Idx": 3765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842248.380, "dur": 2.528, + "args": { + "External id": 233655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842249.026, "dur": 1.478, + "args": { + "External id": 233656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842249.514, "dur": 0.931, + "args": { + "External id": 233657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842254.422, "dur": 4.489, + "args": { + "External id": 233658,"Record function id": 0, "Ev Idx": 3769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842255.934, "dur": 2.584, + "args": { + "External id": 233659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842256.549, "dur": 1.439, + "args": { + "External id": 233660,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842257.235, "dur": 0.689, + "args": { + "External id": 233661,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842262.297, "dur": 7.758, + "args": { + "External id": 233662,"Record function id": 0, "Ev Idx": 3773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842266.674, "dur": 2.951, + "args": { + "External id": 233663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842267.565, "dur": 1.657, + "args": { + "External id": 233664,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842268.124, "dur": 1.026, + "args": { + "External id": 233665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842273.047, "dur": 4.584, + "args": { + "External id": 233666,"Record function id": 0, "Ev Idx": 3777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842274.614, "dur": 2.606, + "args": { + "External id": 233667,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842275.254, "dur": 1.544, + "args": { + "External id": 233668,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842275.944, "dur": 0.790, + "args": { + "External id": 233669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842281.011, "dur": 4.721, + "args": { + "External id": 233670,"Record function id": 0, "Ev Idx": 3781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115842282.180, "dur": 3.140, + "args": { + "External id": 233671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115842282.673, "dur": 2.231, + "args": { + "External id": 233672,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115842283.882, "dur": 0.959, + "args": { + "External id": 233673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115842289.947, "dur": 15237.669, + "args": { + "External id": 233674,"Record function id": 0, "Sequence number": 2757755, "Fwd thread id": 1, "Ev Idx": 3785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115842291.388, "dur": 15226.700, + "args": { + "External id": 233675,"Sequence number": 2757755, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3786 + } + }, + { + "ph": "f", "id": 201, "pid": 4183442, "tid": 31331, "ts": 667115842291.388, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115842320.350, "dur": 40.445, + "args": { + "External id": 233676,"Record function id": 0, "Ev Idx": 3787 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115842367.927, "dur": 67.772, + "args": { + "External id": 233677,"Record function id": 0, "Ev Idx": 3788 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.5)", "pid": 4183442, "tid": 31331, + "ts": 667115842441.237, "dur": 15068.817, + "args": { + "External id": 233678,"Record function id": 0, "Ev Idx": 3789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115842549.285, "dur": 8.140, + "args": { + "External id": 233679,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115842567.514, "dur": 4.991, + "args": { + "External id": 233680,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115842585.915, "dur": 14210.659, + "args": { + "External id": 233681,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115842603.078, "dur": 14184.955, + "args": { + "External id": 233682,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115842625.742, "dur": 15.845, + "args": { + "External id": 233683,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115842645.519, "dur": 14108.803, + "args": { + "External id": 233684,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115842647.650, "dur": 14105.982, + "args": { + "External id": 233685,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115842689.042, "dur": 5.592, + "args": { + "External id": 233686,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115842696.468, "dur": 14053.685, + "args": { + "External id": 233687,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115856883.392, "dur": 8.744, + "args": { + "External id": 233688,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115856886.020, "dur": 5.811, + "args": { + "External id": 233689,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115856919.998, "dur": 306.387, + "args": { + "External id": 233690,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115856945.709, "dur": 276.367, + "args": { + "External id": 233691,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3802, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115856956.082, "dur": 261.716, + "args": { + "External id": 233692,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115857242.807, "dur": 2.089, + "args": { + "External id": 233693,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3804, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857294.298, "dur": 5.803, + "args": { + "External id": 233694,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857344.223, "dur": 1.464, + "args": { + "External id": 233695,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857360.612, "dur": 1.693, + "args": { + "External id": 233696,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857373.944, "dur": 2.786, + "args": { + "External id": 233697,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857387.178, "dur": 0.755, + "args": { + "External id": 233698,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857398.343, "dur": 0.846, + "args": { + "External id": 233699,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857410.191, "dur": 0.760, + "args": { + "External id": 233700,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857422.036, "dur": 3.146, + "args": { + "External id": 233701,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857436.175, "dur": 0.971, + "args": { + "External id": 233702,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115857542.308, "dur": 2582.716, + "args": { + "External id": 233703,"Record function id": 0, "Ev Idx": 3814 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115857563.198, "dur": 984.257, + "args": { + "External id": 233704,"Record function id": 0, "Ev Idx": 3815 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115857576.600, "dur": 340.124, + "args": { + "External id": 233705,"Record function id": 0, "Ev Idx": 3816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857699.009, "dur": 5.269, + "args": { + "External id": 233706,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857707.994, "dur": 1.492, + "args": { + "External id": 233707,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857711.281, "dur": 1.243, + "args": { + "External id": 233708,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857714.213, "dur": 1.178, + "args": { + "External id": 233709,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857717.065, "dur": 2.980, + "args": { + "External id": 233710,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857721.381, "dur": 1.445, + "args": { + "External id": 233711,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857724.630, "dur": 1.268, + "args": { + "External id": 233712,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857727.383, "dur": 1.308, + "args": { + "External id": 233713,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857730.560, "dur": 1.278, + "args": { + "External id": 233714,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115857733.917, "dur": 1.369, + "args": { + "External id": 233715,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115857754.020, "dur": 133.245, + "args": { + "External id": 233716,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115857769.484, "dur": 113.528, + "args": { + "External id": 233717,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115857781.957, "dur": 13.353, + "args": { + "External id": 233718,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115857797.831, "dur": 60.988, + "args": { + "External id": 233719,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115857800.221, "dur": 58.272, + "args": { + "External id": 233720,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115857803.960, "dur": 5.470, + "args": { + "External id": 233721,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115857810.917, "dur": 47.128, + "args": { + "External id": 233722,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3833 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.3", "pid": 4183442, "tid": 31331, + "ts": 667115858001.840, "dur": 538.195, + "args": { + "External id": 233723,"Record function id": 0, "Ev Idx": 3834 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115858018.024, "dur": 508.445, + "args": { + "External id": 233724,"Record function id": 0, "Ev Idx": 3835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115858078.514, "dur": 5.953, + "args": { + "External id": 233725,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115858097.881, "dur": 29.737, + "args": { + "External id": 233726,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858102.590, "dur": 1.645, + "args": { + "External id": 233727,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858105.986, "dur": 0.774, + "args": { + "External id": 233728,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858108.621, "dur": 0.679, + "args": { + "External id": 233729,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858110.906, "dur": 0.462, + "args": { + "External id": 233730,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858113.091, "dur": 0.368, + "args": { + "External id": 233731,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858114.628, "dur": 0.467, + "args": { + "External id": 233732,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858116.672, "dur": 0.294, + "args": { + "External id": 233733,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858118.000, "dur": 2.497, + "args": { + "External id": 233734,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858122.215, "dur": 0.593, + "args": { + "External id": 233735,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115858137.467, "dur": 31.432, + "args": { + "External id": 233736,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115858197.016, "dur": 91.161, + "args": { + "External id": 233737,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115858205.855, "dur": 3.455, + "args": { + "External id": 233738,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115858214.035, "dur": 9.909, + "args": { + "External id": 233739,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115858218.096, "dur": 5.448, + "args": { + "External id": 233740,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858221.283, "dur": 1.024, + "args": { + "External id": 233741,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115858230.162, "dur": 23.684, + "args": { + "External id": 233742,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858231.529, "dur": 0.877, + "args": { + "External id": 233743,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858233.696, "dur": 0.521, + "args": { + "External id": 233744,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858236.279, "dur": 0.863, + "args": { + "External id": 233745,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858238.582, "dur": 0.692, + "args": { + "External id": 233746,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858240.442, "dur": 1.773, + "args": { + "External id": 233747,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858243.476, "dur": 0.633, + "args": { + "External id": 233748,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858245.589, "dur": 0.329, + "args": { + "External id": 233749,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858246.956, "dur": 0.412, + "args": { + "External id": 233750,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115858248.844, "dur": 0.773, + "args": { + "External id": 233751,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115858263.557, "dur": 17.837, + "args": { + "External id": 233752,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115858330.912, "dur": 106.623, + "args": { + "External id": 233753,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115858354.992, "dur": 79.372, + "args": { + "External id": 233754,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3865, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115858363.403, "dur": 66.621, + "args": { + "External id": 233755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115858454.025, "dur": 1.698, + "args": { + "External id": 233756,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3867, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115858555.431, "dur": 1546.117, + "args": { + "External id": 233757,"Sequence number": 2757754, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3868 + } + }, + { + "ph": "f", "id": 202, "pid": 4183442, "tid": 31331, "ts": 667115858555.431, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115858701.594, "dur": 101.982, + "args": { + "External id": 233758,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115858847.998, "dur": 37.376, + "args": { + "External id": 233759,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115858901.885, "dur": 38.930, + "args": { + "External id": 233760,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115858950.372, "dur": 26.027, + "args": { + "External id": 233761,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115858982.582, "dur": 32.951, + "args": { + "External id": 233762,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859023.939, "dur": 20.366, + "args": { + "External id": 233763,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859051.169, "dur": 28.795, + "args": { + "External id": 233764,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115859101.694, "dur": 21.627, + "args": { + "External id": 233765,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115859139.497, "dur": 26.003, + "args": { + "External id": 233766,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115859184.649, "dur": 17.292, + "args": { + "External id": 233767,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115859214.424, "dur": 14.179, + "args": { + "External id": 233768,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859238.124, "dur": 35.322, + "args": { + "External id": 233769,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859276.601, "dur": 29.689, + "args": { + "External id": 233770,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115859332.684, "dur": 186.625, + "args": { + "External id": 233771,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115859408.215, "dur": 6.308, + "args": { + "External id": 233772,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115859416.590, "dur": 3.106, + "args": { + "External id": 233773,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115859554.624, "dur": 28.573, + "args": { + "External id": 233774,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115859594.431, "dur": 14.216, + "args": { + "External id": 233775,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859617.132, "dur": 83.963, + "args": { + "External id": 233776,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859711.885, "dur": 35.613, + "args": { + "External id": 233777,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859754.682, "dur": 28.042, + "args": { + "External id": 233778,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859787.668, "dur": 28.606, + "args": { + "External id": 233779,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859822.449, "dur": 26.453, + "args": { + "External id": 233780,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115859857.981, "dur": 28.531, + "args": { + "External id": 233781,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115859905.170, "dur": 24.930, + "args": { + "External id": 233782,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115859951.590, "dur": 23.643, + "args": { + "External id": 233783,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115859991.165, "dur": 21.423, + "args": { + "External id": 233784,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115860026.586, "dur": 15.868, + "args": { + "External id": 233785,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115860054.053, "dur": 19.315, + "args": { + "External id": 233786,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860145.779, "dur": 14.470, + "args": { + "External id": 233787,"Record function id": 0, "Ev Idx": 3898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860148.954, "dur": 10.461, + "args": { + "External id": 233788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860152.883, "dur": 5.487, + "args": { + "External id": 233789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860154.261, "dur": 3.985, + "args": { + "External id": 233790,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860164.162, "dur": 5.194, + "args": { + "External id": 233791,"Record function id": 0, "Ev Idx": 3902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860165.583, "dur": 3.188, + "args": { + "External id": 233792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860166.487, "dur": 1.714, + "args": { + "External id": 233793,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860167.260, "dur": 0.853, + "args": { + "External id": 233794,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860172.616, "dur": 4.056, + "args": { + "External id": 233795,"Record function id": 0, "Ev Idx": 3906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860173.616, "dur": 2.640, + "args": { + "External id": 233796,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860174.264, "dur": 1.563, + "args": { + "External id": 233797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860174.703, "dur": 1.004, + "args": { + "External id": 233798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860179.815, "dur": 5.684, + "args": { + "External id": 233799,"Record function id": 0, "Ev Idx": 3910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860181.256, "dur": 3.790, + "args": { + "External id": 233800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860182.086, "dur": 2.556, + "args": { + "External id": 233801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860182.401, "dur": 2.149, + "args": { + "External id": 233802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860188.647, "dur": 4.205, + "args": { + "External id": 233803,"Record function id": 0, "Ev Idx": 3914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860189.986, "dur": 2.400, + "args": { + "External id": 233804,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860190.486, "dur": 1.502, + "args": { + "External id": 233805,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860190.859, "dur": 1.057, + "args": { + "External id": 233806,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860195.960, "dur": 4.816, + "args": { + "External id": 233807,"Record function id": 0, "Ev Idx": 3918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860197.479, "dur": 2.858, + "args": { + "External id": 233808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860198.214, "dur": 1.598, + "args": { + "External id": 233809,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860198.825, "dur": 0.912, + "args": { + "External id": 233810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860204.106, "dur": 4.164, + "args": { + "External id": 233811,"Record function id": 0, "Ev Idx": 3922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860205.478, "dur": 2.364, + "args": { + "External id": 233812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860206.105, "dur": 1.340, + "args": { + "External id": 233813,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860206.685, "dur": 0.692, + "args": { + "External id": 233814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860211.335, "dur": 4.029, + "args": { + "External id": 233815,"Record function id": 0, "Ev Idx": 3926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860212.578, "dur": 2.378, + "args": { + "External id": 233816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860213.071, "dur": 1.453, + "args": { + "External id": 233817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860213.694, "dur": 0.756, + "args": { + "External id": 233818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860218.390, "dur": 5.302, + "args": { + "External id": 233819,"Record function id": 0, "Ev Idx": 3930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115860219.459, "dur": 3.804, + "args": { + "External id": 233820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115860219.930, "dur": 2.934, + "args": { + "External id": 233821,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115860222.222, "dur": 0.549, + "args": { + "External id": 233822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115860227.925, "dur": 16836.174, + "args": { + "External id": 233823,"Record function id": 0, "Sequence number": 2757753, "Fwd thread id": 1, "Ev Idx": 3934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115860229.183, "dur": 16826.559, + "args": { + "External id": 233824,"Sequence number": 2757753, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3935 + } + }, + { + "ph": "f", "id": 203, "pid": 4183442, "tid": 31331, "ts": 667115860229.183, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115860257.457, "dur": 38.640, + "args": { + "External id": 233825,"Record function id": 0, "Ev Idx": 3936 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115860303.291, "dur": 65.908, + "args": { + "External id": 233826,"Record function id": 0, "Ev Idx": 3937 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.4)", "pid": 4183442, "tid": 31331, + "ts": 667115860375.004, "dur": 16673.841, + "args": { + "External id": 233827,"Record function id": 0, "Ev Idx": 3938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115860456.846, "dur": 6.365, + "args": { + "External id": 233828,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115860475.732, "dur": 4.730, + "args": { + "External id": 233829,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115860515.125, "dur": 15844.636, + "args": { + "External id": 233830,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115860529.137, "dur": 15821.774, + "args": { + "External id": 233831,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115860553.459, "dur": 16.339, + "args": { + "External id": 233832,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115860574.259, "dur": 15738.415, + "args": { + "External id": 233833,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115860576.765, "dur": 15735.138, + "args": { + "External id": 233834,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115860580.558, "dur": 5.355, + "args": { + "External id": 233835,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115860587.540, "dur": 15720.706, + "args": { + "External id": 233836,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115876446.336, "dur": 9.279, + "args": { + "External id": 233837,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115876449.238, "dur": 6.030, + "args": { + "External id": 233838,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115876481.100, "dur": 292.026, + "args": { + "External id": 233839,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115876521.696, "dur": 246.943, + "args": { + "External id": 233840,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3951, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115876533.504, "dur": 229.806, + "args": { + "External id": 233841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115876791.095, "dur": 2.254, + "args": { + "External id": 233842,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3953, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876846.487, "dur": 6.268, + "args": { + "External id": 233843,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876901.305, "dur": 1.701, + "args": { + "External id": 233844,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876918.347, "dur": 1.238, + "args": { + "External id": 233845,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876931.327, "dur": 2.114, + "args": { + "External id": 233846,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876944.000, "dur": 1.007, + "args": { + "External id": 233847,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876954.316, "dur": 0.693, + "args": { + "External id": 233848,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876965.013, "dur": 0.933, + "args": { + "External id": 233849,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876976.373, "dur": 2.378, + "args": { + "External id": 233850,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115876988.466, "dur": 0.923, + "args": { + "External id": 233851,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115877077.205, "dur": 2647.636, + "args": { + "External id": 233852,"Record function id": 0, "Ev Idx": 3963 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115877096.465, "dur": 970.377, + "args": { + "External id": 233853,"Record function id": 0, "Ev Idx": 3964 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115877110.488, "dur": 283.336, + "args": { + "External id": 233854,"Record function id": 0, "Ev Idx": 3965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877189.653, "dur": 4.061, + "args": { + "External id": 233855,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877196.945, "dur": 1.296, + "args": { + "External id": 233856,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877200.146, "dur": 1.067, + "args": { + "External id": 233857,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877202.866, "dur": 1.212, + "args": { + "External id": 233858,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877205.652, "dur": 1.882, + "args": { + "External id": 233859,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877208.875, "dur": 1.013, + "args": { + "External id": 233860,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877211.559, "dur": 0.688, + "args": { + "External id": 233861,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877213.908, "dur": 0.892, + "args": { + "External id": 233862,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877216.443, "dur": 0.879, + "args": { + "External id": 233863,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115877218.923, "dur": 0.780, + "args": { + "External id": 233864,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115877236.352, "dur": 132.245, + "args": { + "External id": 233865,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115877250.770, "dur": 114.243, + "args": { + "External id": 233866,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115877262.136, "dur": 12.682, + "args": { + "External id": 233867,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115877277.520, "dur": 58.617, + "args": { + "External id": 233868,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115877280.120, "dur": 55.691, + "args": { + "External id": 233869,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877283.580, "dur": 5.242, + "args": { + "External id": 233870,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115877290.535, "dur": 44.514, + "args": { + "External id": 233871,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3982 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.2", "pid": 4183442, "tid": 31331, + "ts": 667115877475.207, "dur": 583.848, + "args": { + "External id": 233872,"Record function id": 0, "Ev Idx": 3983 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115877490.381, "dur": 556.697, + "args": { + "External id": 233873,"Record function id": 0, "Ev Idx": 3984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115877570.733, "dur": 6.442, + "args": { + "External id": 233874,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115877591.418, "dur": 29.217, + "args": { + "External id": 233875,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877596.032, "dur": 1.550, + "args": { + "External id": 233876,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877599.658, "dur": 0.665, + "args": { + "External id": 233877,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877601.819, "dur": 0.695, + "args": { + "External id": 233878,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877604.147, "dur": 0.452, + "args": { + "External id": 233879,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877605.773, "dur": 1.135, + "args": { + "External id": 233880,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877608.507, "dur": 0.773, + "args": { + "External id": 233881,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877610.535, "dur": 1.111, + "args": { + "External id": 233882,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877613.355, "dur": 0.874, + "args": { + "External id": 233883,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877615.304, "dur": 0.876, + "args": { + "External id": 233884,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115877631.098, "dur": 69.189, + "args": { + "External id": 233885,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115877734.275, "dur": 105.578, + "args": { + "External id": 233886,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115877744.714, "dur": 4.370, + "args": { + "External id": 233887,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115877754.140, "dur": 10.334, + "args": { + "External id": 233888,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115877758.297, "dur": 5.756, + "args": { + "External id": 233889,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877761.488, "dur": 1.051, + "args": { + "External id": 233890,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115877774.466, "dur": 24.435, + "args": { + "External id": 233891,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877777.009, "dur": 0.933, + "args": { + "External id": 233892,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877779.854, "dur": 0.635, + "args": { + "External id": 233893,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877782.773, "dur": 0.733, + "args": { + "External id": 233894,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877784.752, "dur": 0.636, + "args": { + "External id": 233895,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877786.899, "dur": 0.827, + "args": { + "External id": 233896,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877789.272, "dur": 0.629, + "args": { + "External id": 233897,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877791.965, "dur": 0.550, + "args": { + "External id": 233898,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877793.647, "dur": 0.651, + "args": { + "External id": 233899,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115877795.812, "dur": 0.486, + "args": { + "External id": 233900,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115877808.600, "dur": 20.963, + "args": { + "External id": 233901,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115877883.507, "dur": 102.748, + "args": { + "External id": 233902,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115877903.942, "dur": 79.180, + "args": { + "External id": 233903,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4014, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115877912.724, "dur": 66.432, + "args": { + "External id": 233904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115877998.620, "dur": 1.967, + "args": { + "External id": 233905,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4016, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115878073.937, "dur": 1628.847, + "args": { + "External id": 233906,"Sequence number": 2757752, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4017 + } + }, + { + "ph": "f", "id": 204, "pid": 4183442, "tid": 31331, "ts": 667115878073.937, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878190.432, "dur": 98.120, + "args": { + "External id": 233907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115878323.837, "dur": 38.358, + "args": { + "External id": 233908,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115878379.589, "dur": 44.590, + "args": { + "External id": 233909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878433.565, "dur": 28.055, + "args": { + "External id": 233910,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878467.261, "dur": 60.018, + "args": { + "External id": 233911,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878537.268, "dur": 28.515, + "args": { + "External id": 233912,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878573.150, "dur": 29.642, + "args": { + "External id": 233913,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115878629.469, "dur": 63.048, + "args": { + "External id": 233914,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115878712.910, "dur": 29.181, + "args": { + "External id": 233915,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115878761.647, "dur": 20.097, + "args": { + "External id": 233916,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115878794.328, "dur": 16.647, + "args": { + "External id": 233917,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878819.142, "dur": 42.017, + "args": { + "External id": 233918,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115878864.695, "dur": 31.226, + "args": { + "External id": 233919,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115878926.064, "dur": 175.777, + "args": { + "External id": 233920,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115879003.771, "dur": 6.230, + "args": { + "External id": 233921,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115879011.897, "dur": 3.729, + "args": { + "External id": 233922,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115879132.882, "dur": 24.653, + "args": { + "External id": 233923,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115879168.995, "dur": 14.093, + "args": { + "External id": 233924,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879190.979, "dur": 42.044, + "args": { + "External id": 233925,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879239.145, "dur": 31.966, + "args": { + "External id": 233926,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879277.366, "dur": 27.665, + "args": { + "External id": 233927,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879309.630, "dur": 27.557, + "args": { + "External id": 233928,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879342.458, "dur": 27.241, + "args": { + "External id": 233929,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115879379.312, "dur": 27.781, + "args": { + "External id": 233930,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115879422.562, "dur": 24.701, + "args": { + "External id": 233931,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115879462.748, "dur": 21.721, + "args": { + "External id": 233932,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115879540.106, "dur": 31.033, + "args": { + "External id": 233933,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115879588.241, "dur": 15.200, + "args": { + "External id": 233934,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115879620.128, "dur": 16.820, + "args": { + "External id": 233935,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879746.696, "dur": 18.665, + "args": { + "External id": 233936,"Record function id": 0, "Ev Idx": 4047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879753.034, "dur": 11.446, + "args": { + "External id": 233937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879757.365, "dur": 6.145, + "args": { + "External id": 233938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879758.903, "dur": 4.495, + "args": { + "External id": 233939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879769.434, "dur": 4.893, + "args": { + "External id": 233940,"Record function id": 0, "Ev Idx": 4051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879771.160, "dur": 2.692, + "args": { + "External id": 233941,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879771.854, "dur": 1.559, + "args": { + "External id": 233942,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879772.346, "dur": 0.968, + "args": { + "External id": 233943,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879777.558, "dur": 4.766, + "args": { + "External id": 233944,"Record function id": 0, "Ev Idx": 4055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879778.926, "dur": 2.962, + "args": { + "External id": 233945,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879779.639, "dur": 1.730, + "args": { + "External id": 233946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879780.418, "dur": 0.864, + "args": { + "External id": 233947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879785.646, "dur": 4.780, + "args": { + "External id": 233948,"Record function id": 0, "Ev Idx": 4059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879787.098, "dur": 2.915, + "args": { + "External id": 233949,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879788.087, "dur": 1.333, + "args": { + "External id": 233950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879788.504, "dur": 0.809, + "args": { + "External id": 233951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879793.598, "dur": 5.067, + "args": { + "External id": 233952,"Record function id": 0, "Ev Idx": 4063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879795.162, "dur": 3.054, + "args": { + "External id": 233953,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879796.165, "dur": 1.657, + "args": { + "External id": 233954,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879796.780, "dur": 0.899, + "args": { + "External id": 233955,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879801.885, "dur": 8.213, + "args": { + "External id": 233956,"Record function id": 0, "Ev Idx": 4067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879803.149, "dur": 3.259, + "args": { + "External id": 233957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879803.944, "dur": 1.879, + "args": { + "External id": 233958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879804.930, "dur": 0.792, + "args": { + "External id": 233959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879813.281, "dur": 3.800, + "args": { + "External id": 233960,"Record function id": 0, "Ev Idx": 4071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879814.377, "dur": 2.299, + "args": { + "External id": 233961,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879814.890, "dur": 1.365, + "args": { + "External id": 233962,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879815.240, "dur": 0.916, + "args": { + "External id": 233963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879820.138, "dur": 4.525, + "args": { + "External id": 233964,"Record function id": 0, "Ev Idx": 4075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879821.496, "dur": 2.766, + "args": { + "External id": 233965,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879822.338, "dur": 1.371, + "args": { + "External id": 233966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879822.640, "dur": 1.004, + "args": { + "External id": 233967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879827.978, "dur": 3.693, + "args": { + "External id": 233968,"Record function id": 0, "Ev Idx": 4079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115879829.076, "dur": 2.189, + "args": { + "External id": 233969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115879829.593, "dur": 1.239, + "args": { + "External id": 233970,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115879829.941, "dur": 0.788, + "args": { + "External id": 233971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115879835.822, "dur": 14691.497, + "args": { + "External id": 233972,"Record function id": 0, "Sequence number": 2757751, "Fwd thread id": 1, "Ev Idx": 4083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115879837.202, "dur": 14680.663, + "args": { + "External id": 233973,"Sequence number": 2757751, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4084 + } + }, + { + "ph": "f", "id": 205, "pid": 4183442, "tid": 31331, "ts": 667115879837.202, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115879867.953, "dur": 37.614, + "args": { + "External id": 233974,"Record function id": 0, "Ev Idx": 4085 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115879913.724, "dur": 65.893, + "args": { + "External id": 233975,"Record function id": 0, "Ev Idx": 4086 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.3)", "pid": 4183442, "tid": 31331, + "ts": 667115879985.237, "dur": 14524.333, + "args": { + "External id": 233976,"Record function id": 0, "Ev Idx": 4087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115880069.757, "dur": 6.769, + "args": { + "External id": 233977,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115880085.447, "dur": 8.751, + "args": { + "External id": 233978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115880107.518, "dur": 13751.086, + "args": { + "External id": 233979,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115880120.463, "dur": 13730.280, + "args": { + "External id": 233980,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115880141.776, "dur": 16.977, + "args": { + "External id": 233981,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115880162.956, "dur": 13646.633, + "args": { + "External id": 233982,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115880165.494, "dur": 13643.278, + "args": { + "External id": 233983,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115880168.891, "dur": 4.651, + "args": { + "External id": 233984,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115880188.012, "dur": 13616.873, + "args": { + "External id": 233985,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115893949.006, "dur": 9.929, + "args": { + "External id": 233986,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115893951.835, "dur": 6.702, + "args": { + "External id": 233987,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115893983.874, "dur": 240.038, + "args": { + "External id": 233988,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115894009.096, "dur": 210.921, + "args": { + "External id": 233989,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4100, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115894019.499, "dur": 196.021, + "args": { + "External id": 233990,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115894240.090, "dur": 1.868, + "args": { + "External id": 233991,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4102, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894290.035, "dur": 5.845, + "args": { + "External id": 233992,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894340.386, "dur": 1.787, + "args": { + "External id": 233993,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894357.601, "dur": 1.150, + "args": { + "External id": 233994,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894370.290, "dur": 0.911, + "args": { + "External id": 233995,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894382.534, "dur": 0.914, + "args": { + "External id": 233996,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894394.135, "dur": 0.881, + "args": { + "External id": 233997,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894408.077, "dur": 1.177, + "args": { + "External id": 233998,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894420.950, "dur": 1.002, + "args": { + "External id": 233999,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894432.219, "dur": 1.360, + "args": { + "External id": 234000,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115894542.473, "dur": 2651.678, + "args": { + "External id": 234001,"Record function id": 0, "Ev Idx": 4112 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115894564.079, "dur": 1001.871, + "args": { + "External id": 234002,"Record function id": 0, "Ev Idx": 4113 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115894578.625, "dur": 338.527, + "args": { + "External id": 234003,"Record function id": 0, "Ev Idx": 4114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894698.324, "dur": 4.933, + "args": { + "External id": 234004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894706.696, "dur": 1.133, + "args": { + "External id": 234005,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894709.850, "dur": 1.048, + "args": { + "External id": 234006,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894712.696, "dur": 1.021, + "args": { + "External id": 234007,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894715.383, "dur": 0.806, + "args": { + "External id": 234008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894717.946, "dur": 0.946, + "args": { + "External id": 234009,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894720.503, "dur": 1.140, + "args": { + "External id": 234010,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894723.476, "dur": 0.954, + "args": { + "External id": 234011,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894726.449, "dur": 1.178, + "args": { + "External id": 234012,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115894729.177, "dur": 0.999, + "args": { + "External id": 234013,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115894748.888, "dur": 138.688, + "args": { + "External id": 234014,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115894764.641, "dur": 118.751, + "args": { + "External id": 234015,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115894777.210, "dur": 14.626, + "args": { + "External id": 234016,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115894794.659, "dur": 60.907, + "args": { + "External id": 234017,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115894797.323, "dur": 57.971, + "args": { + "External id": 234018,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115894800.894, "dur": 5.519, + "args": { + "External id": 234019,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115894807.872, "dur": 46.618, + "args": { + "External id": 234020,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4131 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.1", "pid": 4183442, "tid": 31331, + "ts": 667115895006.620, "dur": 551.271, + "args": { + "External id": 234021,"Record function id": 0, "Ev Idx": 4132 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115895023.349, "dur": 521.976, + "args": { + "External id": 234022,"Record function id": 0, "Ev Idx": 4133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115895086.158, "dur": 4.868, + "args": { + "External id": 234023,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115895105.354, "dur": 32.418, + "args": { + "External id": 234024,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895109.511, "dur": 1.834, + "args": { + "External id": 234025,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895113.884, "dur": 1.135, + "args": { + "External id": 234026,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895116.561, "dur": 0.543, + "args": { + "External id": 234027,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895118.386, "dur": 0.738, + "args": { + "External id": 234028,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895120.351, "dur": 0.906, + "args": { + "External id": 234029,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895122.701, "dur": 0.916, + "args": { + "External id": 234030,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895131.369, "dur": 0.822, + "args": { + "External id": 234031,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895132.979, "dur": 0.618, + "args": { + "External id": 234032,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895134.636, "dur": 0.626, + "args": { + "External id": 234033,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115895148.288, "dur": 32.651, + "args": { + "External id": 234034,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115895209.877, "dur": 94.345, + "args": { + "External id": 234035,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115895218.639, "dur": 3.434, + "args": { + "External id": 234036,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115895227.263, "dur": 9.113, + "args": { + "External id": 234037,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115895231.124, "dur": 4.816, + "args": { + "External id": 234038,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895234.323, "dur": 0.502, + "args": { + "External id": 234039,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115895244.265, "dur": 24.653, + "args": { + "External id": 234040,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895246.165, "dur": 0.604, + "args": { + "External id": 234041,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895248.095, "dur": 0.714, + "args": { + "External id": 234042,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895250.255, "dur": 0.603, + "args": { + "External id": 234043,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895251.903, "dur": 0.745, + "args": { + "External id": 234044,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895254.252, "dur": 0.905, + "args": { + "External id": 234045,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895256.199, "dur": 0.706, + "args": { + "External id": 234046,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895257.998, "dur": 0.622, + "args": { + "External id": 234047,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895259.591, "dur": 0.865, + "args": { + "External id": 234048,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115895261.998, "dur": 0.793, + "args": { + "External id": 234049,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115895277.764, "dur": 19.626, + "args": { + "External id": 234050,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115895346.820, "dur": 110.178, + "args": { + "External id": 234051,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115895369.830, "dur": 83.685, + "args": { + "External id": 234052,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4163, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115895378.559, "dur": 71.170, + "args": { + "External id": 234053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115895469.635, "dur": 1.820, + "args": { + "External id": 234054,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4165, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115895573.859, "dur": 1599.595, + "args": { + "External id": 234055,"Sequence number": 2757750, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4166 + } + }, + { + "ph": "f", "id": 206, "pid": 4183442, "tid": 31331, "ts": 667115895573.859, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115895721.166, "dur": 109.370, + "args": { + "External id": 234056,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115895871.303, "dur": 40.920, + "args": { + "External id": 234057,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115895928.773, "dur": 41.400, + "args": { + "External id": 234058,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115895979.223, "dur": 27.291, + "args": { + "External id": 234059,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896012.523, "dur": 34.260, + "args": { + "External id": 234060,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896053.221, "dur": 21.937, + "args": { + "External id": 234061,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896085.303, "dur": 28.748, + "args": { + "External id": 234062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115896136.317, "dur": 24.360, + "args": { + "External id": 234063,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115896186.019, "dur": 28.293, + "args": { + "External id": 234064,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115896231.201, "dur": 19.616, + "args": { + "External id": 234065,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115896263.044, "dur": 15.677, + "args": { + "External id": 234066,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896286.065, "dur": 36.940, + "args": { + "External id": 234067,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896326.122, "dur": 30.634, + "args": { + "External id": 234068,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115896382.333, "dur": 183.402, + "args": { + "External id": 234069,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115896457.267, "dur": 5.780, + "args": { + "External id": 234070,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115896464.895, "dur": 3.017, + "args": { + "External id": 234071,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115896599.059, "dur": 25.221, + "args": { + "External id": 234072,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115896635.743, "dur": 14.796, + "args": { + "External id": 234073,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896698.951, "dur": 56.114, + "args": { + "External id": 234074,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896762.118, "dur": 36.198, + "args": { + "External id": 234075,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896805.200, "dur": 28.798, + "args": { + "External id": 234076,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896842.485, "dur": 28.032, + "args": { + "External id": 234077,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896875.960, "dur": 28.706, + "args": { + "External id": 234078,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115896911.721, "dur": 35.954, + "args": { + "External id": 234079,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115896973.634, "dur": 32.478, + "args": { + "External id": 234080,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115897024.232, "dur": 26.847, + "args": { + "External id": 234081,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115897067.112, "dur": 17.041, + "args": { + "External id": 234082,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115897098.306, "dur": 17.888, + "args": { + "External id": 234083,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115897127.638, "dur": 15.807, + "args": { + "External id": 234084,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897214.787, "dur": 19.068, + "args": { + "External id": 234085,"Record function id": 0, "Ev Idx": 4196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897221.477, "dur": 11.478, + "args": { + "External id": 234086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897225.482, "dur": 6.572, + "args": { + "External id": 234087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897227.034, "dur": 4.910, + "args": { + "External id": 234088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897237.520, "dur": 5.226, + "args": { + "External id": 234089,"Record function id": 0, "Ev Idx": 4200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897239.185, "dur": 3.047, + "args": { + "External id": 234090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897240.313, "dur": 1.426, + "args": { + "External id": 234091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897240.780, "dur": 0.875, + "args": { + "External id": 234092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897246.007, "dur": 3.914, + "args": { + "External id": 234093,"Record function id": 0, "Ev Idx": 4204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897247.222, "dur": 2.313, + "args": { + "External id": 234094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897247.796, "dur": 1.363, + "args": { + "External id": 234095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897248.186, "dur": 0.883, + "args": { + "External id": 234096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897253.177, "dur": 4.548, + "args": { + "External id": 234097,"Record function id": 0, "Ev Idx": 4208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897254.782, "dur": 2.525, + "args": { + "External id": 234098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897255.612, "dur": 1.158, + "args": { + "External id": 234099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897255.904, "dur": 0.780, + "args": { + "External id": 234100,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897260.779, "dur": 4.200, + "args": { + "External id": 234101,"Record function id": 0, "Ev Idx": 4212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897262.014, "dur": 2.557, + "args": { + "External id": 234102,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897262.950, "dur": 1.227, + "args": { + "External id": 234103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897263.442, "dur": 0.670, + "args": { + "External id": 234104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897268.057, "dur": 4.411, + "args": { + "External id": 234105,"Record function id": 0, "Ev Idx": 4216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897269.536, "dur": 2.513, + "args": { + "External id": 234106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897270.021, "dur": 1.505, + "args": { + "External id": 234107,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897270.555, "dur": 0.904, + "args": { + "External id": 234108,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897278.801, "dur": 4.259, + "args": { + "External id": 234109,"Record function id": 0, "Ev Idx": 4220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897279.930, "dur": 2.725, + "args": { + "External id": 234110,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897280.655, "dur": 1.540, + "args": { + "External id": 234111,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897281.395, "dur": 0.725, + "args": { + "External id": 234112,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897286.132, "dur": 4.294, + "args": { + "External id": 234113,"Record function id": 0, "Ev Idx": 4224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897287.229, "dur": 2.786, + "args": { + "External id": 234114,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897287.707, "dur": 1.628, + "args": { + "External id": 234115,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897288.363, "dur": 0.907, + "args": { + "External id": 234116,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897293.839, "dur": 4.558, + "args": { + "External id": 234117,"Record function id": 0, "Ev Idx": 4228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115897295.018, "dur": 2.952, + "args": { + "External id": 234118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115897295.725, "dur": 1.857, + "args": { + "External id": 234119,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115897296.688, "dur": 0.829, + "args": { + "External id": 234120,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115897302.613, "dur": 14802.809, + "args": { + "External id": 234121,"Record function id": 0, "Sequence number": 2757749, "Fwd thread id": 1, "Ev Idx": 4232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115897303.926, "dur": 14792.949, + "args": { + "External id": 234122,"Sequence number": 2757749, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4233 + } + }, + { + "ph": "f", "id": 207, "pid": 4183442, "tid": 31331, "ts": 667115897303.926, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115897333.421, "dur": 37.840, + "args": { + "External id": 234123,"Record function id": 0, "Ev Idx": 4234 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115897378.837, "dur": 71.453, + "args": { + "External id": 234124,"Record function id": 0, "Ev Idx": 4235 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.2)", "pid": 4183442, "tid": 31331, + "ts": 667115897456.516, "dur": 14632.627, + "args": { + "External id": 234125,"Record function id": 0, "Ev Idx": 4236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115897563.295, "dur": 6.872, + "args": { + "External id": 234126,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115897579.957, "dur": 5.073, + "args": { + "External id": 234127,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115897599.323, "dur": 13747.654, + "args": { + "External id": 234128,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115897612.366, "dur": 13726.760, + "args": { + "External id": 234129,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115897635.788, "dur": 14.183, + "args": { + "External id": 234130,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115897688.747, "dur": 13616.058, + "args": { + "External id": 234131,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115897691.147, "dur": 13612.996, + "args": { + "External id": 234132,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115897694.930, "dur": 6.917, + "args": { + "External id": 234133,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115897706.998, "dur": 13593.938, + "args": { + "External id": 234134,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115911436.688, "dur": 8.622, + "args": { + "External id": 234135,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115911439.361, "dur": 5.644, + "args": { + "External id": 234136,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115911472.070, "dur": 333.235, + "args": { + "External id": 234137,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115911507.012, "dur": 293.274, + "args": { + "External id": 234138,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4249, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115911518.965, "dur": 276.064, + "args": { + "External id": 234139,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115911824.639, "dur": 2.374, + "args": { + "External id": 234140,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4251, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911883.449, "dur": 6.320, + "args": { + "External id": 234141,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911935.989, "dur": 1.371, + "args": { + "External id": 234142,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911952.399, "dur": 1.275, + "args": { + "External id": 234143,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911965.768, "dur": 1.158, + "args": { + "External id": 234144,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911978.775, "dur": 1.276, + "args": { + "External id": 234145,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115911990.631, "dur": 1.162, + "args": { + "External id": 234146,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912003.199, "dur": 1.365, + "args": { + "External id": 234147,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912016.377, "dur": 1.153, + "args": { + "External id": 234148,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912027.433, "dur": 0.938, + "args": { + "External id": 234149,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115912118.247, "dur": 2671.926, + "args": { + "External id": 234150,"Record function id": 0, "Ev Idx": 4261 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115912137.906, "dur": 1011.280, + "args": { + "External id": 234151,"Record function id": 0, "Ev Idx": 4262 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115912152.076, "dur": 294.517, + "args": { + "External id": 234152,"Record function id": 0, "Ev Idx": 4263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912233.733, "dur": 3.911, + "args": { + "External id": 234153,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912240.864, "dur": 1.141, + "args": { + "External id": 234154,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912243.935, "dur": 0.871, + "args": { + "External id": 234155,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912246.509, "dur": 1.250, + "args": { + "External id": 234156,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912249.793, "dur": 1.072, + "args": { + "External id": 234157,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912252.571, "dur": 0.969, + "args": { + "External id": 234158,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912255.241, "dur": 1.188, + "args": { + "External id": 234159,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912258.132, "dur": 1.460, + "args": { + "External id": 234160,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912261.389, "dur": 1.097, + "args": { + "External id": 234161,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115912264.242, "dur": 1.847, + "args": { + "External id": 234162,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115912283.733, "dur": 137.781, + "args": { + "External id": 234163,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115912298.657, "dur": 118.877, + "args": { + "External id": 234164,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115912310.596, "dur": 13.093, + "args": { + "External id": 234165,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115912326.489, "dur": 63.538, + "args": { + "External id": 234166,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115912329.043, "dur": 60.605, + "args": { + "External id": 234167,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912334.149, "dur": 6.308, + "args": { + "External id": 234168,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115912343.604, "dur": 45.438, + "args": { + "External id": 234169,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4280 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.0", "pid": 4183442, "tid": 31331, + "ts": 667115912557.259, "dur": 584.495, + "args": { + "External id": 234170,"Record function id": 0, "Ev Idx": 4281 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115912573.183, "dur": 555.689, + "args": { + "External id": 234171,"Record function id": 0, "Ev Idx": 4282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115912635.844, "dur": 5.420, + "args": { + "External id": 234172,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115912693.012, "dur": 28.695, + "args": { + "External id": 234173,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912697.433, "dur": 1.625, + "args": { + "External id": 234174,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912701.376, "dur": 0.747, + "args": { + "External id": 234175,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912705.345, "dur": 0.746, + "args": { + "External id": 234176,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912707.251, "dur": 0.814, + "args": { + "External id": 234177,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912709.324, "dur": 0.759, + "args": { + "External id": 234178,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912712.421, "dur": 0.290, + "args": { + "External id": 234179,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912713.876, "dur": 0.573, + "args": { + "External id": 234180,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912715.617, "dur": 1.180, + "args": { + "External id": 234181,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912717.858, "dur": 0.733, + "args": { + "External id": 234182,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115912732.848, "dur": 35.307, + "args": { + "External id": 234183,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 31331, + "ts": 667115912802.274, "dur": 106.204, + "args": { + "External id": 234184,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115912812.957, "dur": 4.576, + "args": { + "External id": 234185,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 31331, + "ts": 667115912822.458, "dur": 9.334, + "args": { + "External id": 234186,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 31331, + "ts": 667115912826.316, "dur": 5.078, + "args": { + "External id": 234187,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912829.359, "dur": 0.867, + "args": { + "External id": 234188,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 31331, + "ts": 667115912838.728, "dur": 30.382, + "args": { + "External id": 234189,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912843.897, "dur": 0.575, + "args": { + "External id": 234190,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912845.966, "dur": 1.545, + "args": { + "External id": 234191,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912848.717, "dur": 1.233, + "args": { + "External id": 234192,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912851.096, "dur": 0.860, + "args": { + "External id": 234193,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912854.363, "dur": 0.757, + "args": { + "External id": 234194,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912856.037, "dur": 0.436, + "args": { + "External id": 234195,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912857.688, "dur": 0.953, + "args": { + "External id": 234196,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912860.488, "dur": 0.487, + "args": { + "External id": 234197,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115912861.852, "dur": 0.807, + "args": { + "External id": 234198,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 31331, + "ts": 667115912879.370, "dur": 19.035, + "args": { + "External id": 234199,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 31331, + "ts": 667115912953.872, "dur": 107.545, + "args": { + "External id": 234200,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115912976.970, "dur": 81.289, + "args": { + "External id": 234201,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4312, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 31331, + "ts": 667115912985.816, "dur": 68.577, + "args": { + "External id": 234202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115913074.576, "dur": 1.751, + "args": { + "External id": 234203,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4314, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115913160.060, "dur": 1607.563, + "args": { + "External id": 234204,"Sequence number": 2757748, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4315 + } + }, + { + "ph": "f", "id": 208, "pid": 4183442, "tid": 31331, "ts": 667115913160.060, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913270.738, "dur": 96.935, + "args": { + "External id": 234205,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115913404.899, "dur": 40.498, + "args": { + "External id": 234206,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115913461.537, "dur": 63.086, + "args": { + "External id": 234207,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913537.505, "dur": 33.699, + "args": { + "External id": 234208,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913577.454, "dur": 33.423, + "args": { + "External id": 234209,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913617.349, "dur": 21.925, + "args": { + "External id": 234210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913646.322, "dur": 70.123, + "args": { + "External id": 234211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115913743.870, "dur": 26.589, + "args": { + "External id": 234212,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115913789.568, "dur": 26.552, + "args": { + "External id": 234213,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115913838.881, "dur": 19.992, + "args": { + "External id": 234214,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115913871.337, "dur": 14.907, + "args": { + "External id": 234215,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913899.658, "dur": 39.855, + "args": { + "External id": 234216,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115913942.860, "dur": 31.003, + "args": { + "External id": 234217,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115914000.584, "dur": 165.551, + "args": { + "External id": 234218,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115914073.615, "dur": 5.809, + "args": { + "External id": 234219,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115914081.205, "dur": 5.104, + "args": { + "External id": 234220,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115914196.620, "dur": 24.113, + "args": { + "External id": 234221,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115914232.076, "dur": 14.451, + "args": { + "External id": 234222,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914254.063, "dur": 42.741, + "args": { + "External id": 234223,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914302.851, "dur": 30.423, + "args": { + "External id": 234224,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914339.279, "dur": 27.053, + "args": { + "External id": 234225,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914373.888, "dur": 28.685, + "args": { + "External id": 234226,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914408.070, "dur": 26.343, + "args": { + "External id": 234227,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115914442.028, "dur": 31.995, + "args": { + "External id": 234228,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115914487.733, "dur": 54.687, + "args": { + "External id": 234229,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115914572.128, "dur": 28.890, + "args": { + "External id": 234230,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115914615.877, "dur": 15.833, + "args": { + "External id": 234231,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115914683.834, "dur": 21.650, + "args": { + "External id": 234232,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115914720.561, "dur": 14.998, + "args": { + "External id": 234233,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914814.554, "dur": 15.567, + "args": { + "External id": 234234,"Record function id": 0, "Ev Idx": 4345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914818.122, "dur": 11.110, + "args": { + "External id": 234235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914822.207, "dur": 5.939, + "args": { + "External id": 234236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914823.768, "dur": 4.272, + "args": { + "External id": 234237,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914833.896, "dur": 5.742, + "args": { + "External id": 234238,"Record function id": 0, "Ev Idx": 4349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914835.673, "dur": 3.490, + "args": { + "External id": 234239,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914836.720, "dur": 1.919, + "args": { + "External id": 234240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914837.520, "dur": 1.021, + "args": { + "External id": 234241,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914842.873, "dur": 5.453, + "args": { + "External id": 234242,"Record function id": 0, "Ev Idx": 4353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914844.659, "dur": 3.196, + "args": { + "External id": 234243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914845.424, "dur": 2.036, + "args": { + "External id": 234244,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914846.232, "dur": 1.160, + "args": { + "External id": 234245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914851.533, "dur": 5.033, + "args": { + "External id": 234246,"Record function id": 0, "Ev Idx": 4357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914853.124, "dur": 2.981, + "args": { + "External id": 234247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914853.885, "dur": 1.708, + "args": { + "External id": 234248,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914854.501, "dur": 1.025, + "args": { + "External id": 234249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914859.660, "dur": 5.339, + "args": { + "External id": 234250,"Record function id": 0, "Ev Idx": 4361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914861.488, "dur": 3.048, + "args": { + "External id": 234251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914862.198, "dur": 1.951, + "args": { + "External id": 234252,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914862.905, "dur": 1.146, + "args": { + "External id": 234253,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914870.948, "dur": 3.473, + "args": { + "External id": 234254,"Record function id": 0, "Ev Idx": 4365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914871.901, "dur": 2.077, + "args": { + "External id": 234255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914872.494, "dur": 1.094, + "args": { + "External id": 234256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914872.785, "dur": 0.735, + "args": { + "External id": 234257,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914877.589, "dur": 4.127, + "args": { + "External id": 234258,"Record function id": 0, "Ev Idx": 4369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914878.761, "dur": 2.523, + "args": { + "External id": 234259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914879.678, "dur": 1.218, + "args": { + "External id": 234260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914880.141, "dur": 0.682, + "args": { + "External id": 234261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914884.751, "dur": 4.125, + "args": { + "External id": 234262,"Record function id": 0, "Ev Idx": 4373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914885.924, "dur": 2.523, + "args": { + "External id": 234263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914886.615, "dur": 1.415, + "args": { + "External id": 234264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914887.189, "dur": 0.769, + "args": { + "External id": 234265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914892.042, "dur": 4.199, + "args": { + "External id": 234266,"Record function id": 0, "Ev Idx": 4377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115914893.272, "dur": 2.549, + "args": { + "External id": 234267,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115914894.088, "dur": 1.277, + "args": { + "External id": 234268,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115914894.456, "dur": 0.837, + "args": { + "External id": 234269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115914900.535, "dur": 14898.343, + "args": { + "External id": 234270,"Record function id": 0, "Sequence number": 2757747, "Fwd thread id": 1, "Ev Idx": 4381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115914901.862, "dur": 14889.033, + "args": { + "External id": 234271,"Sequence number": 2757747, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4382 + } + }, + { + "ph": "f", "id": 209, "pid": 4183442, "tid": 31331, "ts": 667115914901.862, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115914934.930, "dur": 39.200, + "args": { + "External id": 234272,"Record function id": 0, "Ev Idx": 4383 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115914981.367, "dur": 72.628, + "args": { + "External id": 234273,"Record function id": 0, "Ev Idx": 4384 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.1)", "pid": 4183442, "tid": 31331, + "ts": 667115915059.997, "dur": 14723.185, + "args": { + "External id": 234274,"Record function id": 0, "Ev Idx": 4385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115915138.672, "dur": 6.564, + "args": { + "External id": 234275,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115915157.858, "dur": 4.372, + "args": { + "External id": 234276,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115915175.305, "dur": 13923.726, + "args": { + "External id": 234277,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115915188.267, "dur": 13903.287, + "args": { + "External id": 234278,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115915211.181, "dur": 16.921, + "args": { + "External id": 234279,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115915231.812, "dur": 13826.657, + "args": { + "External id": 234280,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115915235.403, "dur": 13822.354, + "args": { + "External id": 234281,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115915238.934, "dur": 4.645, + "args": { + "External id": 234282,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115915245.138, "dur": 13809.231, + "args": { + "External id": 234283,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115929186.169, "dur": 9.725, + "args": { + "External id": 234284,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115929188.983, "dur": 6.611, + "args": { + "External id": 234285,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115929222.001, "dur": 237.222, + "args": { + "External id": 234286,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115929246.622, "dur": 208.674, + "args": { + "External id": 234287,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4398, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115929257.925, "dur": 192.727, + "args": { + "External id": 234288,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115929473.912, "dur": 1.872, + "args": { + "External id": 234289,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4400, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929541.457, "dur": 6.087, + "args": { + "External id": 234290,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929591.655, "dur": 1.487, + "args": { + "External id": 234291,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929608.731, "dur": 1.356, + "args": { + "External id": 234292,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929622.546, "dur": 1.103, + "args": { + "External id": 234293,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929634.294, "dur": 1.457, + "args": { + "External id": 234294,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929646.532, "dur": 0.986, + "args": { + "External id": 234295,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929694.904, "dur": 1.853, + "args": { + "External id": 234296,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929709.068, "dur": 1.311, + "args": { + "External id": 234297,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115929719.902, "dur": 1.119, + "args": { + "External id": 234298,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115929813.772, "dur": 2025.131, + "args": { + "External id": 234299,"Record function id": 0, "Ev Idx": 4410 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115929834.420, "dur": 402.592, + "args": { + "External id": 234300,"Record function id": 0, "Ev Idx": 4411 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115929849.110, "dur": 292.663, + "args": { + "External id": 234301,"Record function id": 0, "Ev Idx": 4412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929932.616, "dur": 4.426, + "args": { + "External id": 234302,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929940.350, "dur": 1.232, + "args": { + "External id": 234303,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929943.271, "dur": 1.535, + "args": { + "External id": 234304,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929946.693, "dur": 1.040, + "args": { + "External id": 234305,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929949.187, "dur": 1.285, + "args": { + "External id": 234306,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929952.279, "dur": 0.790, + "args": { + "External id": 234307,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929954.905, "dur": 1.269, + "args": { + "External id": 234308,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929957.520, "dur": 1.172, + "args": { + "External id": 234309,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929960.238, "dur": 1.758, + "args": { + "External id": 234310,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115929963.647, "dur": 1.584, + "args": { + "External id": 234311,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115929982.169, "dur": 133.808, + "args": { + "External id": 234312,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 31331, + "ts": 667115929997.983, "dur": 113.980, + "args": { + "External id": 234313,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115930010.301, "dur": 12.812, + "args": { + "External id": 234314,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115930025.644, "dur": 61.781, + "args": { + "External id": 234315,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115930028.662, "dur": 58.437, + "args": { + "External id": 234316,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115930032.477, "dur": 5.493, + "args": { + "External id": 234317,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115930039.706, "dur": 46.911, + "args": { + "External id": 234318,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115930243.851, "dur": 1571.814, + "args": { + "External id": 234319,"Sequence number": 2757746, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4430 + } + }, + { + "ph": "f", "id": 210, "pid": 4183442, "tid": 31331, "ts": 667115930243.851, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930347.277, "dur": 95.183, + "args": { + "External id": 234320,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183442, "tid": 31331, + "ts": 667115930477.903, "dur": 59.753, + "args": { + "External id": 234321,"kernel_hash": "cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/ym/cymleroaygho35xdr4vv3vcbtafmyvjwchgalgzinbv65zukrlm3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183442, "tid": 31331, + "ts": 667115930557.824, "dur": 43.284, + "args": { + "External id": 234322,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930610.879, "dur": 25.266, + "args": { + "External id": 234323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930642.298, "dur": 73.984, + "args": { + "External id": 234324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930728.088, "dur": 27.190, + "args": { + "External id": 234325,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930764.095, "dur": 28.905, + "args": { + "External id": 234326,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183442, "tid": 31331, + "ts": 667115930821.266, "dur": 24.267, + "args": { + "External id": 234327,"kernel_hash": "cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/jy/cjyjgz2jkfmqllsvaienwafxdkekayxh2xmhsjlc7qteyaov2i2x.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183442, "tid": 31331, + "ts": 667115930863.289, "dur": 28.376, + "args": { + "External id": 234328,"kernel_hash": "cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/n2/cn2dq73bvaua6jd3aqsfcig3emiah3nmddyxywudzqqadxenrwdu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115930910.304, "dur": 19.370, + "args": { + "External id": 234329,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115930942.034, "dur": 19.541, + "args": { + "External id": 234330,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115930970.635, "dur": 38.862, + "args": { + "External id": 234331,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931013.072, "dur": 30.211, + "args": { + "External id": 234332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183442, "tid": 31331, + "ts": 667115931069.597, "dur": 164.893, + "args": { + "External id": 234333,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115931139.705, "dur": 6.319, + "args": { + "External id": 234334,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115931147.881, "dur": 3.218, + "args": { + "External id": 234335,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115931268.845, "dur": 26.317, + "args": { + "External id": 234336,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 31331, + "ts": 667115931306.805, "dur": 13.889, + "args": { + "External id": 234337,"kernel_hash": "cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/pe/cpeyhcav2yhauamgtiarv5ao4h2jk77iwprlvpmyx2vrdaakqu4u.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931329.025, "dur": 41.317, + "args": { + "External id": 234338,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931376.629, "dur": 31.273, + "args": { + "External id": 234339,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931414.536, "dur": 27.236, + "args": { + "External id": 234340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931446.884, "dur": 30.874, + "args": { + "External id": 234341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931483.237, "dur": 49.004, + "args": { + "External id": 234342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 31331, + "ts": 667115931543.150, "dur": 31.137, + "args": { + "External id": 234343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183442, "tid": 31331, + "ts": 667115931591.934, "dur": 23.914, + "args": { + "External id": 234344,"kernel_hash": "cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/md/cmdpl3fmzgwvlu4zjrj26na6s63vjzqdvg7uex53dnjeuzvbfif5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183442, "tid": 31331, + "ts": 667115931633.336, "dur": 59.498, + "args": { + "External id": 234345,"kernel_hash": "cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/is/cisiydiq3pkh2eayiijunpynfugwes22eick37xty632mhbuxc33.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183442, "tid": 31331, + "ts": 667115931710.963, "dur": 18.494, + "args": { + "External id": 234346,"kernel_hash": "ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tv/ctvkswplemxk7vi3fhouphohrimozy5qt6yu33yve7d7kpusmluq.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183442, "tid": 31331, + "ts": 667115931745.001, "dur": 14.816, + "args": { + "External id": 234347,"kernel_hash": "cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ef/cef4y3prmbiy72fask5ogsa7p3maswpi5cur54twrqqbw7624ada.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183442, "tid": 31331, + "ts": 667115931771.724, "dur": 15.074, + "args": { + "External id": 234348,"kernel_hash": "cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/fw/cfwqczljqvqqdvqa2imyrah4emx4utdw6xfehx2a4lfjhqcgn7q5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931859.378, "dur": 16.894, + "args": { + "External id": 234349,"Record function id": 0, "Ev Idx": 4460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931863.167, "dur": 12.191, + "args": { + "External id": 234350,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931867.342, "dur": 7.073, + "args": { + "External id": 234351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931868.774, "dur": 5.526, + "args": { + "External id": 234352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931880.195, "dur": 5.344, + "args": { + "External id": 234353,"Record function id": 0, "Ev Idx": 4464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931881.538, "dur": 3.542, + "args": { + "External id": 234354,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931882.839, "dur": 1.779, + "args": { + "External id": 234355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931883.404, "dur": 1.096, + "args": { + "External id": 234356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931888.958, "dur": 5.139, + "args": { + "External id": 234357,"Record function id": 0, "Ev Idx": 4468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931890.590, "dur": 3.088, + "args": { + "External id": 234358,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931891.238, "dur": 2.037, + "args": { + "External id": 234359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931892.199, "dur": 0.982, + "args": { + "External id": 234360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931897.442, "dur": 5.108, + "args": { + "External id": 234361,"Record function id": 0, "Ev Idx": 4472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931899.442, "dur": 2.649, + "args": { + "External id": 234362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931900.095, "dur": 1.427, + "args": { + "External id": 234363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931900.735, "dur": 0.714, + "args": { + "External id": 234364,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931905.645, "dur": 5.231, + "args": { + "External id": 234365,"Record function id": 0, "Ev Idx": 4476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931907.424, "dur": 2.986, + "args": { + "External id": 234366,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931908.285, "dur": 1.708, + "args": { + "External id": 234367,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931908.844, "dur": 1.067, + "args": { + "External id": 234368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931913.886, "dur": 4.524, + "args": { + "External id": 234369,"Record function id": 0, "Ev Idx": 4480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931915.708, "dur": 2.258, + "args": { + "External id": 234370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931916.260, "dur": 1.313, + "args": { + "External id": 234371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931916.867, "dur": 0.624, + "args": { + "External id": 234372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931921.644, "dur": 4.339, + "args": { + "External id": 234373,"Record function id": 0, "Ev Idx": 4484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931923.159, "dur": 2.410, + "args": { + "External id": 234374,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931923.782, "dur": 1.340, + "args": { + "External id": 234375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931924.116, "dur": 0.940, + "args": { + "External id": 234376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931929.079, "dur": 4.616, + "args": { + "External id": 234377,"Record function id": 0, "Ev Idx": 4488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931930.926, "dur": 2.309, + "args": { + "External id": 234378,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931931.664, "dur": 1.192, + "args": { + "External id": 234379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931932.040, "dur": 0.753, + "args": { + "External id": 234380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931936.902, "dur": 4.654, + "args": { + "External id": 234381,"Record function id": 0, "Ev Idx": 4492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115931938.276, "dur": 2.861, + "args": { + "External id": 234382,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115931939.023, "dur": 1.714, + "args": { + "External id": 234383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115931939.753, "dur": 0.922, + "args": { + "External id": 234384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115931945.689, "dur": 15397.034, + "args": { + "External id": 234385,"Record function id": 0, "Sequence number": 2757745, "Fwd thread id": 1, "Ev Idx": 4496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115931947.206, "dur": 15386.958, + "args": { + "External id": 234386,"Sequence number": 2757745, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4497 + } + }, + { + "ph": "f", "id": 211, "pid": 4183442, "tid": 31331, "ts": 667115931947.206, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115931976.255, "dur": 38.027, + "args": { + "External id": 234387,"Record function id": 0, "Ev Idx": 4498 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115932021.801, "dur": 75.111, + "args": { + "External id": 234388,"Record function id": 0, "Ev Idx": 4499 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.0)", "pid": 4183442, "tid": 31331, + "ts": 667115932102.778, "dur": 15224.091, + "args": { + "External id": 234389,"Record function id": 0, "Ev Idx": 4500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115932201.400, "dur": 8.802, + "args": { + "External id": 234390,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115932223.740, "dur": 5.165, + "args": { + "External id": 234391,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115932242.551, "dur": 14468.264, + "args": { + "External id": 234392,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115932255.722, "dur": 14447.317, + "args": { + "External id": 234393,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115932282.806, "dur": 13.866, + "args": { + "External id": 234394,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115932300.600, "dur": 14341.979, + "args": { + "External id": 234395,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115932302.915, "dur": 14338.852, + "args": { + "External id": 234396,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115932307.088, "dur": 5.271, + "args": { + "External id": 234397,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115932313.824, "dur": 14324.794, + "args": { + "External id": 234398,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115946792.306, "dur": 9.358, + "args": { + "External id": 234399,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115946795.335, "dur": 6.000, + "args": { + "External id": 234400,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115946826.715, "dur": 236.904, + "args": { + "External id": 234401,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115946851.978, "dur": 207.639, + "args": { + "External id": 234402,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4513, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115946861.918, "dur": 192.416, + "args": { + "External id": 234403,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115947078.354, "dur": 1.809, + "args": { + "External id": 234404,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4515, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947126.982, "dur": 5.724, + "args": { + "External id": 234405,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947178.006, "dur": 1.552, + "args": { + "External id": 234406,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947195.186, "dur": 1.699, + "args": { + "External id": 234407,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947208.774, "dur": 0.918, + "args": { + "External id": 234408,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947220.064, "dur": 0.978, + "args": { + "External id": 234409,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947231.775, "dur": 0.812, + "args": { + "External id": 234410,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947244.015, "dur": 0.940, + "args": { + "External id": 234411,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947256.567, "dur": 1.075, + "args": { + "External id": 234412,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115947267.034, "dur": 1.034, + "args": { + "External id": 234413,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115947355.603, "dur": 283.980, + "args": { + "External id": 234414,"Record function id": 0, "Sequence number": 2757744, "Fwd thread id": 1, "Ev Idx": 4525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183442, "tid": 31331, + "ts": 667115947357.996, "dur": 273.071, + "args": { + "External id": 234415,"Sequence number": 2757744, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4526 + } + }, + { + "ph": "f", "id": 212, "pid": 4183442, "tid": 31331, "ts": 667115947357.996, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_0", "pid": 4183442, "tid": 31331, + "ts": 667115947475.424, "dur": 59.657, + "args": { + "External id": 234416,"kernel_hash": "c4wvcz6icn3qia6c3hm4xlywbrxxj3su5oefjj5tcccobmcqdffh", "grid": "grid(32768000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "32768000"], "kernel_file": "/tmp/torchinductor_cvm/4w/c4wvcz6icn3qia6c3hm4xlywbrxxj3su5oefjj5tcccobmcqdffh.py", "kernel_backend": "triton", "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 4527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_1", "pid": 4183442, "tid": 31331, + "ts": 667115947550.445, "dur": 27.791, + "args": { + "External id": 234417,"kernel_hash": "cpkuvyxwue4m6pukwwpmhfva4zggyzxnrhyfwi5kc6arz3vkfkgb", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/pk/cpkuvyxwue4m6pukwwpmhfva4zggyzxnrhyfwi5kc6arz3vkfkgb.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "float", "Scalar"], "Input Strides": [[4096, 1], [4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096], [16, 4096, 1024], [32000, 1024], []], "Ev Idx": 4528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_2", "pid": 4183442, "tid": 31331, + "ts": 667115947594.764, "dur": 21.407, + "args": { + "External id": 234418,"kernel_hash": "c4d5p2qstwhhpqnif6zd5ioc2pm5u242vfmznxzmzrlxasxyhpya", "grid": "grid(32768000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "32768000"], "kernel_file": "/tmp/torchinductor_cvm/4d/c4d5p2qstwhhpqnif6zd5ioc2pm5u242vfmznxzmzrlxasxyhpya.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 4529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115947650.909, "dur": 51.171, + "args": { + "External id": 234419,"Record function id": 0, "Ev Idx": 4530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183442, "tid": 31331, + "ts": 667115947689.654, "dur": 11.182, + "args": { + "External id": 234420,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 31331, + "ts": 667115947693.278, "dur": 6.189, + "args": { + "External id": 234421,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 31331, + "ts": 667115947694.768, "dur": 4.450, + "args": { + "External id": 234422,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4533 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::root_post_backward_callback", "pid": 4183442, "tid": 31331, + "ts": 667115947727.186, "dur": 7738.791, + "args": { + "External id": 234423,"Record function id": 0, "Ev Idx": 4534 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate", "pid": 4183442, "tid": 31331, + "ts": 667115947746.416, "dur": 38.397, + "args": { + "External id": 234424,"Record function id": 0, "Ev Idx": 4535 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard", "pid": 4183442, "tid": 31331, + "ts": 667115947790.827, "dur": 260.304, + "args": { + "External id": 234425,"Record function id": 0, "Ev Idx": 4536 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce", "pid": 4183442, "tid": 31331, + "ts": 667115948056.850, "dur": 7206.549, + "args": { + "External id": 234426,"Record function id": 0, "Ev Idx": 4537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115948173.085, "dur": 7.145, + "args": { + "External id": 234427,"Record function id": 0, "Concrete Inputs": ["[116925440]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 31331, + "ts": 667115948190.510, "dur": 5.131, + "args": { + "External id": 234428,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[116925440], []], "Ev Idx": 4539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115948214.425, "dur": 5797.043, + "args": { + "External id": 234429,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [14615680, 1]], "Input Dims": [[], [], [], [8, 14615680]], "Ev Idx": 4540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183442, "tid": 31331, + "ts": 667115948231.762, "dur": 5768.738, + "args": { + "External id": 234430,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [14615680, 1]], "Input Dims": [[], [], [], [8, 14615680]], "Ev Idx": 4541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115948327.481, "dur": 14.139, + "args": { + "External id": 234431,"Record function id": 0, "Concrete Inputs": ["[28789]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 31331, + "ts": 667115948374.721, "dur": 5587.059, + "args": { + "External id": 234432,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[28789], [], [], [], [], [], [], []], "Ev Idx": 4543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 31331, + "ts": 667115948377.127, "dur": 5583.899, + "args": { + "External id": 234433,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[28789], [], [], [], [], [], []], "Ev Idx": 4544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 31331, + "ts": 667115948381.082, "dur": 5.687, + "args": { + "External id": 234434,"Record function id": 0, "Concrete Inputs": ["[28789]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 31331, + "ts": 667115948388.582, "dur": 5568.393, + "args": { + "External id": 234435,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[28789], [28789], []], "Ev Idx": 4546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 31331, + "ts": 667115954132.292, "dur": 9.363, + "args": { + "External id": 234436,"Record function id": 0, "Concrete Inputs": ["", "[14615680]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[116925440], [], [], [], [], []], "Ev Idx": 4547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 31331, + "ts": 667115954135.136, "dur": 6.181, + "args": { + "External id": 234437,"Record function id": 0, "Concrete Inputs": ["[14615680]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183442, "tid": 31331, + "ts": 667115954170.749, "dur": 430.906, + "args": { + "External id": 234438,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[14615680], [116925440], [], [], [], []], "Ev Idx": 4549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115954195.465, "dur": 400.942, + "args": { + "External id": 234439,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 14615680, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[116925440], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4550, "In msg nelems": 116925440 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183442, "tid": 31331, + "ts": 667115954206.199, "dur": 385.008, + "args": { + "External id": 234440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[116925440]], "Ev Idx": 4551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 31331, + "ts": 667115954627.267, "dur": 2.291, + "args": { + "External id": 234441,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4552, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954723.511, "dur": 7.231, + "args": { + "External id": 234442,"Record function id": 0, "Concrete Inputs": ["", "[4000, 1024]", "[1024, 1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954776.207, "dur": 1.713, + "args": { + "External id": 234443,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4096000"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954794.021, "dur": 1.385, + "args": { + "External id": 234444,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4096128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954807.901, "dur": 0.857, + "args": { + "External id": 234445,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4227200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954819.828, "dur": 1.314, + "args": { + "External id": 234446,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4358272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954831.317, "dur": 1.527, + "args": { + "External id": 234447,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4489344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954843.056, "dur": 1.534, + "args": { + "External id": 234448,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4620416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954855.325, "dur": 1.291, + "args": { + "External id": 234449,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "4620544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954866.767, "dur": 1.520, + "args": { + "External id": 234450,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "4980992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954878.315, "dur": 1.041, + "args": { + "External id": 234451,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "5341440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954889.619, "dur": 1.472, + "args": { + "External id": 234452,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "5701888"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954900.812, "dur": 1.607, + "args": { + "External id": 234453,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5702016"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954912.443, "dur": 1.602, + "args": { + "External id": 234454,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5833088"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954923.208, "dur": 1.550, + "args": { + "External id": 234455,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5964160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954934.010, "dur": 1.457, + "args": { + "External id": 234456,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "6095232"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954945.069, "dur": 1.412, + "args": { + "External id": 234457,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "6226304"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954955.945, "dur": 1.613, + "args": { + "External id": 234458,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "6226432"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954966.715, "dur": 1.325, + "args": { + "External id": 234459,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "6586880"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954977.476, "dur": 1.508, + "args": { + "External id": 234460,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "6947328"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954988.189, "dur": 1.329, + "args": { + "External id": 234461,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7307776"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115954998.600, "dur": 1.336, + "args": { + "External id": 234462,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7307904"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955010.015, "dur": 1.681, + "args": { + "External id": 234463,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7438976"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955021.078, "dur": 1.369, + "args": { + "External id": 234464,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7570048"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955031.582, "dur": 1.165, + "args": { + "External id": 234465,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7701120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955042.288, "dur": 1.606, + "args": { + "External id": 234466,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7832192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955053.588, "dur": 1.326, + "args": { + "External id": 234467,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "7832320"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955063.893, "dur": 1.635, + "args": { + "External id": 234468,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "8192768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955074.237, "dur": 1.618, + "args": { + "External id": 234469,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "8553216"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955085.556, "dur": 1.619, + "args": { + "External id": 234470,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8913664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955097.098, "dur": 1.376, + "args": { + "External id": 234471,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "8913792"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955107.870, "dur": 1.797, + "args": { + "External id": 234472,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9044864"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955119.135, "dur": 1.408, + "args": { + "External id": 234473,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9175936"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955129.896, "dur": 2.114, + "args": { + "External id": 234474,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9307008"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955141.189, "dur": 1.106, + "args": { + "External id": 234475,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9438080"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955151.479, "dur": 1.190, + "args": { + "External id": 234476,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "9438208"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955162.783, "dur": 1.335, + "args": { + "External id": 234477,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "9798656"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955174.706, "dur": 1.462, + "args": { + "External id": 234478,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "10159104"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955186.882, "dur": 1.516, + "args": { + "External id": 234479,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10519552"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 31331, + "ts": 667115955199.623, "dur": 1.787, + "args": { + "External id": 234480,"Record function id": 0, "Concrete Inputs": ["", "[4000, 1024]", "[1024, 1]", "10519680"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4591 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "ProfilerStep#12287", "pid": 4183442, "tid": 4183442, + "ts": 667115183062.121, "dur": 786558.679, + "args": { + "External id": 225793,"Record function id": 0, "Ev Idx": 4592 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.zero_grad#AdamW.zero_grad", "pid": 4183442, "tid": 4183442, + "ts": 667115183094.363, "dur": 492.391, + "args": { + "External id": 225794,"Record function id": 0, "Ev Idx": 4593 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "enumerate(DataLoader)#_StatefulMultiProcessingDataLoaderIter.__next__", "pid": 4183442, "tid": 4183442, + "ts": 667115183626.722, "dur": 2131.974, + "args": { + "External id": 225795,"Record function id": 0, "Ev Idx": 4594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115184683.202, "dur": 8.104, + "args": { + "External id": 225796,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183442, "tid": 4183442, + "ts": 667115184711.942, "dur": 6.674, + "args": { + "External id": 225797,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115185179.761, "dur": 2.232, + "args": { + "External id": 225798,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183442, "tid": 4183442, + "ts": 667115185189.515, "dur": 2.473, + "args": { + "External id": 225799,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115185617.922, "dur": 1.667, + "args": { + "External id": 225800,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183442, "tid": 4183442, + "ts": 667115185627.160, "dur": 2.255, + "args": { + "External id": 225801,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115186282.452, "dur": 13.232, + "args": { + "External id": 225802,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 4601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115186289.411, "dur": 2.305, + "args": { + "External id": 225803,"Record function id": 0, "Concrete Inputs": ["", "[16, 8192]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 4602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115186297.405, "dur": 4.430, + "args": { + "External id": 225804,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 4603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115186299.892, "dur": 0.923, + "args": { + "External id": 225805,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 4604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115186326.652, "dur": 556.084, + "args": { + "External id": 225806,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], [], []], "Ev Idx": 4605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115186334.017, "dur": 547.814, + "args": { + "External id": 225807,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 4606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115186342.683, "dur": 9.905, + "args": { + "External id": 225808,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115186354.922, "dur": 525.475, + "args": { + "External id": 225809,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115186364.292, "dur": 0.432, + "args": { + "External id": 225810,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 4609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 4183442, "tid": 4183442, + "ts": 667115186367.263, "dur": 9.092, + "args": { + "External id": 225811,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[8192, 1], [4096, 1]], "Input Dims": [[16, 4096], [16, 4096]], "Ev Idx": 4610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183442, "tid": 4183442, + "ts": 667115186372.641, "dur": 3.562, + "args": { + "External id": 225812,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], []], "Input Dims": [[16, 4096], [], []], "Ev Idx": 4611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115186375.461, "dur": 0.496, + "args": { + "External id": 225813,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115186378.481, "dur": 216.506, + "args": { + "External id": 225814,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 4613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115186381.121, "dur": 213.481, + "args": { + "External id": 225815,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 4614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115186383.548, "dur": 15.569, + "args": { + "External id": 225816,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 4615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115186386.027, "dur": 12.641, + "args": { + "External id": 225817,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115186399.997, "dur": 193.819, + "args": { + "External id": 225818,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115186597.784, "dur": 278.098, + "args": { + "External id": 225819,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115186901.808, "dur": 449.332, + "args": { + "External id": 225820,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 4619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115186904.313, "dur": 445.976, + "args": { + "External id": 225821,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], []], "Ev Idx": 4620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115186911.455, "dur": 8.399, + "args": { + "External id": 225822,"Record function id": 0, "Concrete Inputs": ["[16, 8192]", "[8192, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115186921.131, "dur": 426.991, + "args": { + "External id": 225823,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[8192, 1], [8192, 1], []], "Input Dims": [[16, 8192], [16, 8192], []], "Ev Idx": 4622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 4183442, "tid": 4183442, + "ts": 667115187375.038, "dur": 50.048, + "args": { + "External id": 225824,"Record function id": 0, "Concrete Inputs": ["0", "4096", "", "", "", "False"], "Input type": ["Scalar", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115187379.481, "dur": 4.639, + "args": { + "External id": 225825,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 4183442, "tid": 4183442, + "ts": 667115187386.617, "dur": 38.075, + "args": { + "External id": 225826,"Record function id": 0, "Concrete Inputs": ["0", "4096", "1", ""], "Input type": ["Scalar", "Scalar", "Scalar", "long int"], "Input Strides": [[], [], [], [1]], "Input Dims": [[], [], [], [0]], "Ev Idx": 4625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115187391.444, "dur": 6.078, + "args": { + "External id": 225827,"Record function id": 0, "Concrete Inputs": ["", "[4096]", ""], "Input type": ["long int", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 4626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::repeat", "pid": 4183442, "tid": 4183442, + "ts": 667115187437.708, "dur": 89.676, + "args": { + "External id": 225828,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4096], []], "Ev Idx": 4627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183442, "tid": 4183442, + "ts": 667115187442.143, "dur": 6.988, + "args": { + "External id": 225829,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[4096], [], []], "Ev Idx": 4628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115187447.066, "dur": 1.797, + "args": { + "External id": 225830,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "[4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[4096], [], [], []], "Ev Idx": 4629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115187450.098, "dur": 5.134, + "args": { + "External id": 225831,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 4183442, + "ts": 667115187460.105, "dur": 3.579, + "args": { + "External id": 225832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[4096, 1]], "Input Dims": [[16, 4096]], "Ev Idx": 4631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183442, "tid": 4183442, + "ts": 667115187466.210, "dur": 6.055, + "args": { + "External id": 225833,"Record function id": 0, "Concrete Inputs": ["", "0", "1", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115187470.992, "dur": 1.150, + "args": { + "External id": 225834,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1]", "[4096, 1, 4096]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183442, "tid": 4183442, + "ts": 667115187473.012, "dur": 5.254, + "args": { + "External id": 225835,"Record function id": 0, "Concrete Inputs": ["", "1", "4096", "4096"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 4634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115187477.002, "dur": 1.177, + "args": { + "External id": 225836,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[4096, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 4635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 4183442, "tid": 4183442, + "ts": 667115187479.948, "dur": 3.820, + "args": { + "External id": 225837,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[4096, 1], [4096, 4096, 4096, 1]], "Input Dims": [[1, 4096], [16, 1, 1, 4096]], "Ev Idx": 4636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183442, "tid": 4183442, + "ts": 667115187481.169, "dur": 2.477, + "args": { + "External id": 225838,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[4096, 1], [], []], "Input Dims": [[1, 4096], [], []], "Ev Idx": 4637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115187482.481, "dur": 1.064, + "args": { + "External id": 225839,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[0, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[1, 4096], [], [], []], "Ev Idx": 4638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115187484.531, "dur": 41.459, + "args": { + "External id": 225840,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 4096, 4096, 1], [0, 4096, 4096, 1], []], "Input Dims": [[16, 1, 1, 4096], [16, 1, 1, 4096], []], "Ev Idx": 4639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115187536.876, "dur": 33.829, + "args": { + "External id": 225841,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 4640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115187538.901, "dur": 31.631, + "args": { + "External id": 225842,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "", "", "", "False", ""], "Input type": ["long int", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 4641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115187547.201, "dur": 3.738, + "args": { + "External id": 225843,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "3", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115187551.686, "dur": 18.492, + "args": { + "External id": 225844,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4643 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::root_pre_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115187719.957, "dur": 156.862, + "args": { + "External id": 225845,"Record function id": 0, "Ev Idx": 4644 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::inputs_to_device", "pid": 4183442, "tid": 4183442, + "ts": 667115187805.695, "dur": 60.597, + "args": { + "External id": 225846,"Record function id": 0, "Ev Idx": 4645 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115187884.860, "dur": 42.908, + "args": { + "External id": 225847,"Record function id": 0, "Ev Idx": 4646 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115187936.034, "dur": 7857.551, + "args": { + "External id": 225848,"Record function id": 0, "Ev Idx": 4647 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather", "pid": 4183442, "tid": 4183442, + "ts": 667115187946.736, "dur": 1246.839, + "args": { + "External id": 225849,"Record function id": 0, "Ev Idx": 4648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115188067.489, "dur": 7.384, + "args": { + "External id": 225850,"Record function id": 0, "Concrete Inputs": ["[14615680]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115188092.561, "dur": 142.333, + "args": { + "External id": 225851,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[14615680], [], []], "Ev Idx": 4650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188097.633, "dur": 1.589, + "args": { + "External id": 225852,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188105.836, "dur": 0.428, + "args": { + "External id": 225853,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4096000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188107.163, "dur": 0.457, + "args": { + "External id": 225854,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4096128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188108.514, "dur": 2.467, + "args": { + "External id": 225855,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4227200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188116.298, "dur": 0.564, + "args": { + "External id": 225856,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4358272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188117.800, "dur": 0.529, + "args": { + "External id": 225857,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4489344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188118.834, "dur": 2.653, + "args": { + "External id": 225858,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4620416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188124.537, "dur": 0.727, + "args": { + "External id": 225859,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "4620544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188125.951, "dur": 0.864, + "args": { + "External id": 225860,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "4980992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188131.824, "dur": 0.234, + "args": { + "External id": 225861,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "5341440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188132.948, "dur": 0.411, + "args": { + "External id": 225862,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "5701888"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188134.379, "dur": 1.680, + "args": { + "External id": 225863,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5702016"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188141.488, "dur": 0.332, + "args": { + "External id": 225864,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5833088"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188142.555, "dur": 0.364, + "args": { + "External id": 225865,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5964160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188143.579, "dur": 2.175, + "args": { + "External id": 225866,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "6095232"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188149.137, "dur": 0.265, + "args": { + "External id": 225867,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "6226304"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188150.038, "dur": 0.426, + "args": { + "External id": 225868,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6226432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188155.491, "dur": 0.277, + "args": { + "External id": 225869,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6586880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188156.582, "dur": 0.361, + "args": { + "External id": 225870,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6947328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188157.800, "dur": 1.736, + "args": { + "External id": 225871,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7307776"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188164.226, "dur": 0.412, + "args": { + "External id": 225872,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7307904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188165.284, "dur": 0.310, + "args": { + "External id": 225873,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7438976"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188166.258, "dur": 2.561, + "args": { + "External id": 225874,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7570048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188172.065, "dur": 0.277, + "args": { + "External id": 225875,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7701120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188172.966, "dur": 0.341, + "args": { + "External id": 225876,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7832192"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188177.947, "dur": 0.310, + "args": { + "External id": 225877,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "7832320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188178.907, "dur": 0.824, + "args": { + "External id": 225878,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8192768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188180.441, "dur": 2.294, + "args": { + "External id": 225879,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188187.455, "dur": 0.355, + "args": { + "External id": 225880,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8913664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188188.405, "dur": 0.267, + "args": { + "External id": 225881,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8913792"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188189.290, "dur": 2.042, + "args": { + "External id": 225882,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9044864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188194.685, "dur": 0.414, + "args": { + "External id": 225883,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9175936"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188195.890, "dur": 0.582, + "args": { + "External id": 225884,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9307008"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188201.735, "dur": 0.382, + "args": { + "External id": 225885,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9438080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188202.811, "dur": 0.419, + "args": { + "External id": 225886,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9438208"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188204.328, "dur": 2.235, + "args": { + "External id": 225887,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9798656"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188211.070, "dur": 0.176, + "args": { + "External id": 225888,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159104"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188211.914, "dur": 0.341, + "args": { + "External id": 225889,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10519552"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188212.873, "dur": 2.629, + "args": { + "External id": 225890,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "10519680"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115188262.407, "dur": 51.224, + "args": { + "External id": 225891,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 4690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115188390.038, "dur": 324.278, + "args": { + "External id": 225892,"Record function id": 0, "Concrete Inputs": ["", "", "14615680", "8", "6", "15", ""], "Input type": ["TensorList", "", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 4691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115188406.258, "dur": 4.589, + "args": { + "External id": 225893,"Record function id": 0, "Concrete Inputs": ["[116925440]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115188417.660, "dur": 13.278, + "args": { + "External id": 225894,"Record function id": 0, "Concrete Inputs": ["", "0", "87694080", "14615680"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[116925440], [], [], []], "Ev Idx": 4693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115188422.165, "dur": 8.306, + "args": { + "External id": 225895,"Record function id": 0, "Concrete Inputs": ["", "0", "87694080", "102309760", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[116925440], [], [], [], []], "Ev Idx": 4694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188427.136, "dur": 0.790, + "args": { + "External id": 225896,"Record function id": 0, "Concrete Inputs": ["", "[14615680]", "[1]", "87694080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[116925440], [], [], []], "Ev Idx": 4695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115188438.600, "dur": 156.467, + "args": { + "External id": 225897,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[14615680], [], []], "Ev Idx": 4696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188440.338, "dur": 0.630, + "args": { + "External id": 225898,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "87694080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188442.449, "dur": 0.708, + "args": { + "External id": 225899,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "91790080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188453.280, "dur": 2.930, + "args": { + "External id": 225900,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "91790208"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188457.196, "dur": 0.695, + "args": { + "External id": 225901,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "91921280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188460.713, "dur": 0.440, + "args": { + "External id": 225902,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "92052352"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188461.972, "dur": 0.548, + "args": { + "External id": 225903,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "92183424"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188463.677, "dur": 0.535, + "args": { + "External id": 225904,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "92314496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188467.733, "dur": 0.822, + "args": { + "External id": 225905,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "92314624"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188469.291, "dur": 1.655, + "args": { + "External id": 225906,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "92675072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188472.129, "dur": 0.633, + "args": { + "External id": 225907,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "93035520"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188476.844, "dur": 2.193, + "args": { + "External id": 225908,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "93395968"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188480.336, "dur": 0.228, + "args": { + "External id": 225909,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "93396096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188483.305, "dur": 2.881, + "args": { + "External id": 225910,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "93527168"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188487.023, "dur": 0.370, + "args": { + "External id": 225911,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "93658240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188487.957, "dur": 0.489, + "args": { + "External id": 225912,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "93789312"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188512.642, "dur": 0.764, + "args": { + "External id": 225913,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "93920384"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188514.496, "dur": 0.292, + "args": { + "External id": 225914,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "93920512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188515.362, "dur": 0.449, + "args": { + "External id": 225915,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "94280960"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188521.791, "dur": 2.006, + "args": { + "External id": 225916,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "94641408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188524.701, "dur": 0.243, + "args": { + "External id": 225917,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "95001856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188527.846, "dur": 2.386, + "args": { + "External id": 225918,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "95001984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188530.901, "dur": 0.805, + "args": { + "External id": 225919,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "95133056"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188532.260, "dur": 0.264, + "args": { + "External id": 225920,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "95264128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188537.340, "dur": 0.547, + "args": { + "External id": 225921,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "95395200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188538.460, "dur": 0.625, + "args": { + "External id": 225922,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "95526272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188540.026, "dur": 0.524, + "args": { + "External id": 225923,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "95526400"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188545.266, "dur": 1.967, + "args": { + "External id": 225924,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "95886848"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188548.100, "dur": 0.616, + "args": { + "External id": 225925,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "96247296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188551.288, "dur": 2.285, + "args": { + "External id": 225926,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "96607744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188554.324, "dur": 0.257, + "args": { + "External id": 225927,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "96607872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188555.306, "dur": 0.341, + "args": { + "External id": 225928,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "96738944"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188561.397, "dur": 0.343, + "args": { + "External id": 225929,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "96870016"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188562.466, "dur": 0.333, + "args": { + "External id": 225930,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "97001088"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188563.532, "dur": 0.262, + "args": { + "External id": 225931,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "97132160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188568.799, "dur": 1.968, + "args": { + "External id": 225932,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "97132288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188571.372, "dur": 0.177, + "args": { + "External id": 225933,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "97492736"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188574.086, "dur": 2.626, + "args": { + "External id": 225934,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "97853184"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188577.356, "dur": 0.273, + "args": { + "External id": 225935,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "98213632"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115188578.255, "dur": 0.144, + "args": { + "External id": 225936,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "98213760"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115188622.730, "dur": 72.799, + "args": { + "External id": 225937,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 4736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115188776.835, "dur": 310.941, + "args": { + "External id": 225938,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[116925440], [14615680], [], [], []], "Ev Idx": 4737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115188811.755, "dur": 271.474, + "args": { + "External id": 225939,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 116925440, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[14615680], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4738, "In msg nelems": 14615680 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115188823.081, "dur": 254.784, + "args": { + "External id": 225940,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[14615680]], "Ev Idx": 4739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115189112.967, "dur": 2.172, + "args": { + "External id": 225941,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4740, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out", "pid": 4183442, "tid": 4183442, + "ts": 667115189209.535, "dur": 6341.045, + "args": { + "External id": 225942,"Record function id": 0, "Ev Idx": 4741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189426.173, "dur": 6.190, + "args": { + "External id": 225943,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[116925440], []], "Ev Idx": 4742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189435.938, "dur": 1.743, + "args": { + "External id": 225944,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[32768000], []], "Ev Idx": 4743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189439.411, "dur": 1.548, + "args": { + "External id": 225945,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189442.827, "dur": 3.022, + "args": { + "External id": 225946,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189449.288, "dur": 1.147, + "args": { + "External id": 225947,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189452.036, "dur": 1.159, + "args": { + "External id": 225948,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189454.763, "dur": 1.087, + "args": { + "External id": 225949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189457.247, "dur": 2.420, + "args": { + "External id": 225950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189466.048, "dur": 1.057, + "args": { + "External id": 225951,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189468.718, "dur": 1.000, + "args": { + "External id": 225952,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189471.202, "dur": 1.287, + "args": { + "External id": 225953,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189473.956, "dur": 3.224, + "args": { + "External id": 225954,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189480.810, "dur": 1.088, + "args": { + "External id": 225955,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189483.250, "dur": 1.372, + "args": { + "External id": 225956,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189485.925, "dur": 0.831, + "args": { + "External id": 225957,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189487.871, "dur": 20.941, + "args": { + "External id": 225958,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189517.878, "dur": 1.249, + "args": { + "External id": 225959,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189520.547, "dur": 1.157, + "args": { + "External id": 225960,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189523.209, "dur": 0.649, + "args": { + "External id": 225961,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189525.389, "dur": 2.849, + "args": { + "External id": 225962,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189532.355, "dur": 0.952, + "args": { + "External id": 225963,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189534.668, "dur": 1.191, + "args": { + "External id": 225964,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189537.262, "dur": 0.667, + "args": { + "External id": 225965,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189539.452, "dur": 2.482, + "args": { + "External id": 225966,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189561.530, "dur": 0.956, + "args": { + "External id": 225967,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189563.743, "dur": 0.997, + "args": { + "External id": 225968,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189566.343, "dur": 0.998, + "args": { + "External id": 225969,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189568.671, "dur": 1.975, + "args": { + "External id": 225970,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189574.886, "dur": 0.998, + "args": { + "External id": 225971,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189577.296, "dur": 1.357, + "args": { + "External id": 225972,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189580.058, "dur": 0.908, + "args": { + "External id": 225973,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189582.095, "dur": 2.128, + "args": { + "External id": 225974,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189590.298, "dur": 1.070, + "args": { + "External id": 225975,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189592.644, "dur": 0.949, + "args": { + "External id": 225976,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189594.892, "dur": 0.973, + "args": { + "External id": 225977,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189597.314, "dur": 2.835, + "args": { + "External id": 225978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189603.805, "dur": 1.273, + "args": { + "External id": 225979,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189606.459, "dur": 1.126, + "args": { + "External id": 225980,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189608.940, "dur": 0.752, + "args": { + "External id": 225981,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115189610.927, "dur": 1.711, + "args": { + "External id": 225982,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[32768000], []], "Ev Idx": 4781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115189645.364, "dur": 5837.291, + "args": { + "External id": 225983,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[14615680, 1], [], [], []], "Input Dims": [[8, 14615680], [], [], []], "Ev Idx": 4782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115189707.814, "dur": 5765.538, + "args": { + "External id": 225984,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[14615680, 1], [], [], []], "Input Dims": [[8, 14615680], [], [], []], "Ev Idx": 4783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115189731.884, "dur": 6.380, + "args": { + "External id": 225985,"Record function id": 0, "Concrete Inputs": ["[3034]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115189743.837, "dur": 5691.522, + "args": { + "External id": 225986,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3034], [], [], [], [], [], [], []], "Ev Idx": 4785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115189746.585, "dur": 5688.258, + "args": { + "External id": 225987,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3034], [], [], [], [], [], []], "Ev Idx": 4786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115189753.758, "dur": 7.353, + "args": { + "External id": 225988,"Record function id": 0, "Concrete Inputs": ["[3034]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115189762.737, "dur": 5668.708, + "args": { + "External id": 225989,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3034], [3034], []], "Ev Idx": 4788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115195878.106, "dur": 41.492, + "args": { + "External id": 225990,"Record function id": 0, "Ev Idx": 4789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 0/0", "pid": 4183442, "tid": 4183442, + "ts": 667115195921.181, "dur": 214.586, + "args": { + "External id": 225991,"Record function id": 0, "Ev Idx": 4790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115195965.862, "dur": 160.909, + "args": { + "External id": 225992,"Sequence number": 2757744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "long int"], "Input Strides": [[1024, 1], [4096, 1]], "Input Dims": [[32000, 1024], [16, 4096]], "Ev Idx": 4791 + } + }, + { + "ph": "s", "id": 212, "pid": 4183442, "tid": 4183442, "ts": 667115195965.862, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_0", "pid": 4183442, "tid": 4183442, + "ts": 667115196041.010, "dur": 47.217, + "args": { + "External id": 225993,"kernel_hash": "ce3wbgogff3cdlh46bywvlndcayoay5bk3ta62253xatokvf2jsx", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/e3/ce3wbgogff3cdlh46bywvlndcayoay5bk3ta62253xatokvf2jsx.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096], [32000, 1024], [16, 4096, 1024], []], "Ev Idx": 4792 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115196195.362, "dur": 54.459, + "args": { + "External id": 225994,"Record function id": 0, "Ev Idx": 4793 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.0)", "pid": 4183442, "tid": 4183442, + "ts": 667115196260.515, "dur": 6965.553, + "args": { + "External id": 225995,"Record function id": 0, "Ev Idx": 4794 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 4183442, "tid": 4183442, + "ts": 667115196269.358, "dur": 892.387, + "args": { + "External id": 225996,"Record function id": 0, "Ev Idx": 4795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115196346.323, "dur": 10.021, + "args": { + "External id": 225997,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115196369.994, "dur": 46.095, + "args": { + "External id": 225998,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196379.449, "dur": 2.132, + "args": { + "External id": 225999,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196383.291, "dur": 0.887, + "args": { + "External id": 226000,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196384.950, "dur": 3.087, + "args": { + "External id": 226001,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196391.125, "dur": 0.606, + "args": { + "External id": 226002,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196392.435, "dur": 0.855, + "args": { + "External id": 226003,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196396.061, "dur": 0.657, + "args": { + "External id": 226004,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196399.443, "dur": 0.235, + "args": { + "External id": 226005,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196400.585, "dur": 2.679, + "args": { + "External id": 226006,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196408.878, "dur": 0.276, + "args": { + "External id": 226007,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115196426.323, "dur": 36.080, + "args": { + "External id": 226008,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115196513.770, "dur": 122.150, + "args": { + "External id": 226009,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115196525.830, "dur": 6.709, + "args": { + "External id": 226010,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115196537.811, "dur": 12.452, + "args": { + "External id": 226011,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115196541.918, "dur": 7.931, + "args": { + "External id": 226012,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196547.313, "dur": 0.827, + "args": { + "External id": 226013,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115196557.374, "dur": 29.716, + "args": { + "External id": 226014,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196559.209, "dur": 0.642, + "args": { + "External id": 226015,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196563.336, "dur": 0.291, + "args": { + "External id": 226016,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196566.576, "dur": 0.520, + "args": { + "External id": 226017,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196567.856, "dur": 0.407, + "args": { + "External id": 226018,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196571.240, "dur": 2.695, + "args": { + "External id": 226019,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196574.576, "dur": 0.563, + "args": { + "External id": 226020,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196577.737, "dur": 0.223, + "args": { + "External id": 226021,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196580.937, "dur": 0.361, + "args": { + "External id": 226022,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115196581.955, "dur": 0.512, + "args": { + "External id": 226023,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115196600.801, "dur": 26.168, + "args": { + "External id": 226024,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115196730.916, "dur": 336.545, + "args": { + "External id": 226025,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115196762.550, "dur": 299.913, + "args": { + "External id": 226026,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4825, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115196774.019, "dur": 282.065, + "args": { + "External id": 226027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115197091.192, "dur": 2.160, + "args": { + "External id": 226028,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4827, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 4183442, "tid": 4183442, + "ts": 667115197183.108, "dur": 5841.127, + "args": { + "External id": 226029,"Record function id": 0, "Ev Idx": 4828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197288.194, "dur": 6.413, + "args": { + "External id": 226030,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197297.547, "dur": 1.726, + "args": { + "External id": 226031,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197301.061, "dur": 1.496, + "args": { + "External id": 226032,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197304.291, "dur": 2.812, + "args": { + "External id": 226033,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197308.580, "dur": 1.429, + "args": { + "External id": 226034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197313.588, "dur": 1.240, + "args": { + "External id": 226035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197316.427, "dur": 1.196, + "args": { + "External id": 226036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197319.028, "dur": 1.827, + "args": { + "External id": 226037,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197324.153, "dur": 0.948, + "args": { + "External id": 226038,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115197328.549, "dur": 0.939, + "args": { + "External id": 226039,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115197346.039, "dur": 5642.754, + "args": { + "External id": 226040,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115197363.113, "dur": 5619.416, + "args": { + "External id": 226041,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115197385.018, "dur": 14.286, + "args": { + "External id": 226042,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115197402.778, "dur": 5549.760, + "args": { + "External id": 226043,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115197405.429, "dur": 5546.618, + "args": { + "External id": 226044,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115197410.730, "dur": 6.921, + "args": { + "External id": 226045,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115197419.305, "dur": 5529.698, + "args": { + "External id": 226046,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115203170.116, "dur": 32.379, + "args": { + "External id": 226047,"Sequence number": 2757745, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4846 + } + }, + { + "ph": "s", "id": 211, "pid": 4183442, "tid": 4183442, "ts": 667115203170.116, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115203187.731, "dur": 10.059, + "args": { + "External id": 226048,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 4847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115203193.123, "dur": 4.464, + "args": { + "External id": 226049,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 4848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115203266.266, "dur": 93.729, + "args": { + "External id": 226050,"Record function id": 0, "Ev Idx": 4849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115203361.759, "dur": 1215.796, + "args": { + "External id": 226051,"Record function id": 0, "Ev Idx": 4850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115203403.567, "dur": 1159.063, + "args": { + "External id": 226052,"Sequence number": 2757746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 4851 + } + }, + { + "ph": "s", "id": 210, "pid": 4183442, "tid": 4183442, "ts": 667115203403.567, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115203470.663, "dur": 62.658, + "args": { + "External id": 226053,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115203550.059, "dur": 95.030, + "args": { + "External id": 226054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115203728.932, "dur": 45.040, + "args": { + "External id": 226055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115203788.538, "dur": 31.178, + "args": { + "External id": 226056,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115203848.487, "dur": 29.610, + "args": { + "External id": 226057,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115203898.943, "dur": 14.134, + "args": { + "External id": 226058,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115203935.697, "dur": 135.763, + "args": { + "External id": 226059,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 4858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115203991.862, "dur": 11.846, + "args": { + "External id": 226060,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 4859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115203996.809, "dur": 6.177, + "args": { + "External id": 226061,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115204006.326, "dur": 3.446, + "args": { + "External id": 226062,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115204013.405, "dur": 1.306, + "args": { + "External id": 226063,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115204016.990, "dur": 2.448, + "args": { + "External id": 226064,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115204081.982, "dur": 47.745, + "args": { + "External id": 226065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115204165.009, "dur": 29.939, + "args": { + "External id": 226066,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115204202.998, "dur": 57.460, + "args": { + "External id": 226067,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115204270.858, "dur": 52.817, + "args": { + "External id": 226068,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115204345.569, "dur": 25.691, + "args": { + "External id": 226069,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 4868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115204377.494, "dur": 33.984, + "args": { + "External id": 226070,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115204437.851, "dur": 18.970, + "args": { + "External id": 226071,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 4870 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.0)", "pid": 4183442, "tid": 4183442, + "ts": 667115204644.696, "dur": 172.215, + "args": { + "External id": 226072,"Record function id": 0, "Ev Idx": 4871 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115204893.097, "dur": 46.256, + "args": { + "External id": 226073,"Record function id": 0, "Ev Idx": 4872 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.1)", "pid": 4183442, "tid": 4183442, + "ts": 667115204948.765, "dur": 8912.726, + "args": { + "External id": 226074,"Record function id": 0, "Ev Idx": 4873 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 4183442, "tid": 4183442, + "ts": 667115204958.341, "dur": 966.637, + "args": { + "External id": 226075,"Record function id": 0, "Ev Idx": 4874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115205044.955, "dur": 9.038, + "args": { + "External id": 226076,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115205066.889, "dur": 43.977, + "args": { + "External id": 226077,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205073.996, "dur": 2.330, + "args": { + "External id": 226078,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205077.983, "dur": 0.652, + "args": { + "External id": 226079,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205079.768, "dur": 0.956, + "args": { + "External id": 226080,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205086.162, "dur": 0.680, + "args": { + "External id": 226081,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205087.549, "dur": 2.900, + "args": { + "External id": 226082,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205093.098, "dur": 0.591, + "args": { + "External id": 226083,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205096.951, "dur": 0.524, + "args": { + "External id": 226084,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205098.323, "dur": 0.529, + "args": { + "External id": 226085,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205101.887, "dur": 2.381, + "args": { + "External id": 226086,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115205120.954, "dur": 45.836, + "args": { + "External id": 226087,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115205201.343, "dur": 120.349, + "args": { + "External id": 226088,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115205212.009, "dur": 3.956, + "args": { + "External id": 226089,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115205220.977, "dur": 12.625, + "args": { + "External id": 226090,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115205225.245, "dur": 7.950, + "args": { + "External id": 226091,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205230.845, "dur": 1.063, + "args": { + "External id": 226092,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115205240.159, "dur": 32.643, + "args": { + "External id": 226093,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205241.551, "dur": 0.670, + "args": { + "External id": 226094,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205245.828, "dur": 2.626, + "args": { + "External id": 226095,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205249.099, "dur": 2.962, + "args": { + "External id": 226096,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205254.810, "dur": 0.562, + "args": { + "External id": 226097,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205256.077, "dur": 0.779, + "args": { + "External id": 226098,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205259.644, "dur": 0.435, + "args": { + "External id": 226099,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205262.851, "dur": 0.741, + "args": { + "External id": 226100,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205264.296, "dur": 0.326, + "args": { + "External id": 226101,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115205267.848, "dur": 0.319, + "args": { + "External id": 226102,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115205287.310, "dur": 24.736, + "args": { + "External id": 226103,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115205375.570, "dur": 447.723, + "args": { + "External id": 226104,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115205407.328, "dur": 409.801, + "args": { + "External id": 226105,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4904, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115205418.542, "dur": 392.566, + "args": { + "External id": 226106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115205849.073, "dur": 3.035, + "args": { + "External id": 226107,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4906, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 4183442, "tid": 4183442, + "ts": 667115205946.768, "dur": 7660.350, + "args": { + "External id": 226108,"Record function id": 0, "Ev Idx": 4907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206080.590, "dur": 6.621, + "args": { + "External id": 226109,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206090.472, "dur": 2.449, + "args": { + "External id": 226110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206094.514, "dur": 1.410, + "args": { + "External id": 226111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206097.636, "dur": 1.154, + "args": { + "External id": 226112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206100.117, "dur": 2.290, + "args": { + "External id": 226113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206106.179, "dur": 1.575, + "args": { + "External id": 226114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206109.371, "dur": 1.237, + "args": { + "External id": 226115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206114.480, "dur": 5.329, + "args": { + "External id": 226116,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206121.115, "dur": 1.092, + "args": { + "External id": 226117,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115206125.874, "dur": 0.973, + "args": { + "External id": 226118,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115206143.826, "dur": 7425.472, + "args": { + "External id": 226119,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115206161.626, "dur": 7401.293, + "args": { + "External id": 226120,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115206182.375, "dur": 14.836, + "args": { + "External id": 226121,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115206199.892, "dur": 7332.438, + "args": { + "External id": 226122,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115206202.555, "dur": 7329.180, + "args": { + "External id": 226123,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115206208.422, "dur": 5.388, + "args": { + "External id": 226124,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115206215.595, "dur": 7313.243, + "args": { + "External id": 226125,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115213802.750, "dur": 30.354, + "args": { + "External id": 226126,"Sequence number": 2757747, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4925 + } + }, + { + "ph": "s", "id": 209, "pid": 4183442, "tid": 4183442, "ts": 667115213802.750, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115213817.915, "dur": 10.550, + "args": { + "External id": 226127,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 4926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115213823.605, "dur": 4.482, + "args": { + "External id": 226128,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 4927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115213903.197, "dur": 91.745, + "args": { + "External id": 226129,"Record function id": 0, "Ev Idx": 4928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115213996.464, "dur": 1133.879, + "args": { + "External id": 226130,"Record function id": 0, "Ev Idx": 4929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115214036.562, "dur": 1080.457, + "args": { + "External id": 226131,"Sequence number": 2757748, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 4930 + } + }, + { + "ph": "s", "id": 208, "pid": 4183442, "tid": 4183442, "ts": 667115214036.562, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115214113.679, "dur": 41.897, + "args": { + "External id": 226132,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214171.072, "dur": 88.237, + "args": { + "External id": 226133,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214267.500, "dur": 33.394, + "args": { + "External id": 226134,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214306.946, "dur": 29.229, + "args": { + "External id": 226135,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115214367.697, "dur": 25.222, + "args": { + "External id": 226136,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115214408.186, "dur": 17.328, + "args": { + "External id": 226137,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115214440.303, "dur": 179.537, + "args": { + "External id": 226138,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 4937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115214530.726, "dur": 16.599, + "args": { + "External id": 226139,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 4938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115214535.430, "dur": 10.935, + "args": { + "External id": 226140,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115214552.085, "dur": 4.100, + "args": { + "External id": 226141,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115214557.343, "dur": 4.295, + "args": { + "External id": 226142,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115214563.923, "dur": 2.346, + "args": { + "External id": 226143,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214631.128, "dur": 101.967, + "args": { + "External id": 226144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115214769.831, "dur": 28.762, + "args": { + "External id": 226145,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214807.863, "dur": 57.547, + "args": { + "External id": 226146,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214872.705, "dur": 43.539, + "args": { + "External id": 226147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115214941.372, "dur": 26.597, + "args": { + "External id": 226148,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 4947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115214974.018, "dur": 36.580, + "args": { + "External id": 226149,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115215029.141, "dur": 20.149, + "args": { + "External id": 226150,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 4949 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.1)", "pid": 4183442, "tid": 4183442, + "ts": 667115215194.256, "dur": 83.198, + "args": { + "External id": 226151,"Record function id": 0, "Ev Idx": 4950 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115215350.778, "dur": 48.593, + "args": { + "External id": 226152,"Record function id": 0, "Ev Idx": 4951 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.2)", "pid": 4183442, "tid": 4183442, + "ts": 667115215408.298, "dur": 9195.841, + "args": { + "External id": 226153,"Record function id": 0, "Ev Idx": 4952 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 4183442, "tid": 4183442, + "ts": 667115215419.826, "dur": 945.305, + "args": { + "External id": 226154,"Record function id": 0, "Ev Idx": 4953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115215530.706, "dur": 9.111, + "args": { + "External id": 226155,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115215553.652, "dur": 42.664, + "args": { + "External id": 226156,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215561.357, "dur": 2.125, + "args": { + "External id": 226157,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215568.596, "dur": 0.456, + "args": { + "External id": 226158,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215571.824, "dur": 0.506, + "args": { + "External id": 226159,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215573.211, "dur": 0.729, + "args": { + "External id": 226160,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215576.878, "dur": 0.533, + "args": { + "External id": 226161,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215579.986, "dur": 1.035, + "args": { + "External id": 226162,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215581.727, "dur": 3.160, + "args": { + "External id": 226163,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215585.623, "dur": 0.727, + "args": { + "External id": 226164,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215588.923, "dur": 0.287, + "args": { + "External id": 226165,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115215607.179, "dur": 43.125, + "args": { + "External id": 226166,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115215729.522, "dur": 125.247, + "args": { + "External id": 226167,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115215745.316, "dur": 4.992, + "args": { + "External id": 226168,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115215755.640, "dur": 10.886, + "args": { + "External id": 226169,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115215760.216, "dur": 5.907, + "args": { + "External id": 226170,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215763.308, "dur": 1.247, + "args": { + "External id": 226171,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115215772.799, "dur": 36.050, + "args": { + "External id": 226172,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215776.654, "dur": 3.041, + "args": { + "External id": 226173,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215780.548, "dur": 0.680, + "args": { + "External id": 226174,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215781.837, "dur": 0.637, + "args": { + "External id": 226175,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215787.524, "dur": 2.000, + "args": { + "External id": 226176,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215790.168, "dur": 0.353, + "args": { + "External id": 226177,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215791.117, "dur": 0.378, + "args": { + "External id": 226178,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215796.841, "dur": 0.376, + "args": { + "External id": 226179,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215797.890, "dur": 0.350, + "args": { + "External id": 226180,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115215801.055, "dur": 2.472, + "args": { + "External id": 226181,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115215819.052, "dur": 27.593, + "args": { + "External id": 226182,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115215909.242, "dur": 367.670, + "args": { + "External id": 226183,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115215945.494, "dur": 326.425, + "args": { + "External id": 226184,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4983, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115215955.380, "dur": 310.765, + "args": { + "External id": 226185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115216297.894, "dur": 2.455, + "args": { + "External id": 226186,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4985, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 4183442, "tid": 4183442, + "ts": 667115216385.796, "dur": 8000.638, + "args": { + "External id": 226187,"Record function id": 0, "Ev Idx": 4986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216480.343, "dur": 5.373, + "args": { + "External id": 226188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216488.595, "dur": 1.031, + "args": { + "External id": 226189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216516.187, "dur": 3.377, + "args": { + "External id": 226190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216521.464, "dur": 1.177, + "args": { + "External id": 226191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216523.884, "dur": 1.042, + "args": { + "External id": 226192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216528.403, "dur": 1.257, + "args": { + "External id": 226193,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216532.797, "dur": 1.362, + "args": { + "External id": 226194,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216535.617, "dur": 2.222, + "args": { + "External id": 226195,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216539.135, "dur": 1.164, + "args": { + "External id": 226196,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115216544.415, "dur": 0.791, + "args": { + "External id": 226197,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115216563.179, "dur": 7784.366, + "args": { + "External id": 226198,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115216580.106, "dur": 7761.213, + "args": { + "External id": 226199,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115216597.284, "dur": 15.945, + "args": { + "External id": 226200,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115216615.613, "dur": 7692.484, + "args": { + "External id": 226201,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115216618.103, "dur": 7689.544, + "args": { + "External id": 226202,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115216624.350, "dur": 5.529, + "args": { + "External id": 226203,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115216631.454, "dur": 7673.422, + "args": { + "External id": 226204,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115224547.007, "dur": 30.561, + "args": { + "External id": 226205,"Sequence number": 2757749, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5004 + } + }, + { + "ph": "s", "id": 207, "pid": 4183442, "tid": 4183442, "ts": 667115224547.007, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115224563.208, "dur": 9.545, + "args": { + "External id": 226206,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115224568.082, "dur": 4.303, + "args": { + "External id": 226207,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115224645.335, "dur": 117.519, + "args": { + "External id": 226208,"Record function id": 0, "Ev Idx": 5007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115224765.770, "dur": 1070.259, + "args": { + "External id": 226209,"Record function id": 0, "Ev Idx": 5008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115224810.325, "dur": 1011.488, + "args": { + "External id": 226210,"Sequence number": 2757750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5009 + } + }, + { + "ph": "s", "id": 206, "pid": 4183442, "tid": 4183442, "ts": 667115224810.325, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115224879.490, "dur": 42.770, + "args": { + "External id": 226211,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115224935.473, "dur": 90.033, + "args": { + "External id": 226212,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225037.593, "dur": 34.852, + "args": { + "External id": 226213,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225081.428, "dur": 29.268, + "args": { + "External id": 226214,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115225136.242, "dur": 25.350, + "args": { + "External id": 226215,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115225182.080, "dur": 13.681, + "args": { + "External id": 226216,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115225215.706, "dur": 131.127, + "args": { + "External id": 226217,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115225264.932, "dur": 12.894, + "args": { + "External id": 226218,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115225269.489, "dur": 7.553, + "args": { + "External id": 226219,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115225282.208, "dur": 4.123, + "args": { + "External id": 226220,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115225287.668, "dur": 0.908, + "args": { + "External id": 226221,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115225290.878, "dur": 4.689, + "args": { + "External id": 226222,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225358.830, "dur": 42.174, + "args": { + "External id": 226223,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115225429.100, "dur": 26.454, + "args": { + "External id": 226224,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225464.647, "dur": 59.425, + "args": { + "External id": 226225,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225535.672, "dur": 34.850, + "args": { + "External id": 226226,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115225595.365, "dur": 27.440, + "args": { + "External id": 226227,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115225629.128, "dur": 67.245, + "args": { + "External id": 226228,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115225723.431, "dur": 22.012, + "args": { + "External id": 226229,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5028 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.2)", "pid": 4183442, "tid": 4183442, + "ts": 667115225900.214, "dur": 83.254, + "args": { + "External id": 226230,"Record function id": 0, "Ev Idx": 5029 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115226056.692, "dur": 46.537, + "args": { + "External id": 226231,"Record function id": 0, "Ev Idx": 5030 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.3)", "pid": 4183442, "tid": 4183442, + "ts": 667115226111.947, "dur": 8848.277, + "args": { + "External id": 226232,"Record function id": 0, "Ev Idx": 5031 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 4183442, "tid": 4183442, + "ts": 667115226123.243, "dur": 940.639, + "args": { + "External id": 226233,"Record function id": 0, "Ev Idx": 5032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115226203.123, "dur": 8.167, + "args": { + "External id": 226234,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115226223.999, "dur": 46.134, + "args": { + "External id": 226235,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226231.554, "dur": 2.218, + "args": { + "External id": 226236,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226237.892, "dur": 0.373, + "args": { + "External id": 226237,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226241.961, "dur": 0.204, + "args": { + "External id": 226238,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226247.400, "dur": 0.316, + "args": { + "External id": 226239,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226250.953, "dur": 0.630, + "args": { + "External id": 226240,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226253.764, "dur": 0.768, + "args": { + "External id": 226241,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226255.158, "dur": 3.446, + "args": { + "External id": 226242,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226259.481, "dur": 0.412, + "args": { + "External id": 226243,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226262.838, "dur": 0.501, + "args": { + "External id": 226244,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115226280.395, "dur": 40.654, + "args": { + "External id": 226245,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115226352.240, "dur": 131.196, + "args": { + "External id": 226246,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115226366.730, "dur": 3.482, + "args": { + "External id": 226247,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115226374.858, "dur": 9.540, + "args": { + "External id": 226248,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115226379.216, "dur": 4.795, + "args": { + "External id": 226249,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226382.147, "dur": 0.582, + "args": { + "External id": 226250,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115226390.717, "dur": 34.349, + "args": { + "External id": 226251,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226394.437, "dur": 2.790, + "args": { + "External id": 226252,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226398.109, "dur": 0.182, + "args": { + "External id": 226253,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226399.147, "dur": 0.354, + "args": { + "External id": 226254,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226404.488, "dur": 1.223, + "args": { + "External id": 226255,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226406.489, "dur": 0.356, + "args": { + "External id": 226256,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226407.683, "dur": 0.327, + "args": { + "External id": 226257,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226411.883, "dur": 0.486, + "args": { + "External id": 226258,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226413.018, "dur": 0.519, + "args": { + "External id": 226259,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115226417.053, "dur": 2.632, + "args": { + "External id": 226260,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115226449.431, "dur": 26.028, + "args": { + "External id": 226261,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115226557.240, "dur": 406.857, + "args": { + "External id": 226262,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115226592.004, "dur": 367.024, + "args": { + "External id": 226263,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5062, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115226603.331, "dur": 350.246, + "args": { + "External id": 226264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115226987.983, "dur": 2.467, + "args": { + "External id": 226265,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5064, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 4183442, "tid": 4183442, + "ts": 667115227085.805, "dur": 7669.980, + "args": { + "External id": 226266,"Record function id": 0, "Ev Idx": 5065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227193.168, "dur": 6.689, + "args": { + "External id": 226267,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227203.287, "dur": 1.226, + "args": { + "External id": 226268,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227206.187, "dur": 2.121, + "args": { + "External id": 226269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227209.870, "dur": 1.060, + "args": { + "External id": 226270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227212.342, "dur": 1.126, + "args": { + "External id": 226271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227217.171, "dur": 0.927, + "args": { + "External id": 226272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227222.494, "dur": 1.111, + "args": { + "External id": 226273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227224.962, "dur": 2.546, + "args": { + "External id": 226274,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227228.745, "dur": 0.854, + "args": { + "External id": 226275,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115227233.508, "dur": 0.847, + "args": { + "External id": 226276,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115227251.877, "dur": 7465.881, + "args": { + "External id": 226277,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115227269.030, "dur": 7442.214, + "args": { + "External id": 226278,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115227285.224, "dur": 15.468, + "args": { + "External id": 226279,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115227303.128, "dur": 7372.996, + "args": { + "External id": 226280,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115227305.565, "dur": 7369.916, + "args": { + "External id": 226281,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115227311.790, "dur": 5.886, + "args": { + "External id": 226282,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115227319.281, "dur": 7331.347, + "args": { + "External id": 226283,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115234894.965, "dur": 39.940, + "args": { + "External id": 226284,"Sequence number": 2757751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5083 + } + }, + { + "ph": "s", "id": 205, "pid": 4183442, "tid": 4183442, "ts": 667115234894.965, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115234919.804, "dur": 10.262, + "args": { + "External id": 226285,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115234925.349, "dur": 4.456, + "args": { + "External id": 226286,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115234999.757, "dur": 88.531, + "args": { + "External id": 226287,"Record function id": 0, "Ev Idx": 5086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115235089.883, "dur": 1108.040, + "args": { + "External id": 226288,"Record function id": 0, "Ev Idx": 5087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115235125.920, "dur": 1058.193, + "args": { + "External id": 226289,"Sequence number": 2757752, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5088 + } + }, + { + "ph": "s", "id": 204, "pid": 4183442, "tid": 4183442, "ts": 667115235125.920, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115235190.776, "dur": 38.764, + "args": { + "External id": 226290,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235241.662, "dur": 91.326, + "args": { + "External id": 226291,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235345.504, "dur": 34.551, + "args": { + "External id": 226292,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235385.939, "dur": 29.262, + "args": { + "External id": 226293,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115235444.450, "dur": 26.711, + "args": { + "External id": 226294,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115235488.282, "dur": 36.234, + "args": { + "External id": 226295,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115235544.404, "dur": 171.376, + "args": { + "External id": 226296,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115235594.427, "dur": 11.562, + "args": { + "External id": 226297,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115235599.025, "dur": 6.224, + "args": { + "External id": 226298,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115235610.456, "dur": 6.070, + "args": { + "External id": 226299,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115235617.838, "dur": 1.081, + "args": { + "External id": 226300,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115235623.507, "dur": 3.152, + "args": { + "External id": 226301,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235728.524, "dur": 55.833, + "args": { + "External id": 226302,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115235817.122, "dur": 30.350, + "args": { + "External id": 226303,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235856.187, "dur": 38.908, + "args": { + "External id": 226304,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115235930.596, "dur": 49.398, + "args": { + "External id": 226305,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115236008.471, "dur": 27.624, + "args": { + "External id": 226306,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115236041.938, "dur": 36.365, + "args": { + "External id": 226307,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115236097.135, "dur": 20.653, + "args": { + "External id": 226308,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5107 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.3)", "pid": 4183442, "tid": 4183442, + "ts": 667115236260.761, "dur": 76.925, + "args": { + "External id": 226309,"Record function id": 0, "Ev Idx": 5108 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115236409.539, "dur": 49.949, + "args": { + "External id": 226310,"Record function id": 0, "Ev Idx": 5109 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.4)", "pid": 4183442, "tid": 4183442, + "ts": 667115236469.411, "dur": 8850.472, + "args": { + "External id": 226311,"Record function id": 0, "Ev Idx": 5110 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 4183442, "tid": 4183442, + "ts": 667115236479.554, "dur": 919.274, + "args": { + "External id": 226312,"Record function id": 0, "Ev Idx": 5111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115236585.308, "dur": 9.367, + "args": { + "External id": 226313,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115236607.739, "dur": 40.737, + "args": { + "External id": 226314,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236615.785, "dur": 2.164, + "args": { + "External id": 226315,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236622.504, "dur": 0.243, + "args": { + "External id": 226316,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236626.351, "dur": 0.361, + "args": { + "External id": 226317,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236627.218, "dur": 0.267, + "args": { + "External id": 226318,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236630.742, "dur": 0.443, + "args": { + "External id": 226319,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236633.481, "dur": 0.402, + "args": { + "External id": 226320,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236634.408, "dur": 3.550, + "args": { + "External id": 226321,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236638.485, "dur": 0.538, + "args": { + "External id": 226322,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236641.502, "dur": 0.398, + "args": { + "External id": 226323,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115236697.900, "dur": 46.347, + "args": { + "External id": 226324,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115236778.964, "dur": 118.297, + "args": { + "External id": 226325,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115236794.723, "dur": 4.676, + "args": { + "External id": 226326,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115236804.377, "dur": 10.692, + "args": { + "External id": 226327,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115236808.670, "dur": 5.979, + "args": { + "External id": 226328,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236811.829, "dur": 1.130, + "args": { + "External id": 226329,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115236821.737, "dur": 31.851, + "args": { + "External id": 226330,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236824.990, "dur": 3.290, + "args": { + "External id": 226331,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236829.288, "dur": 0.466, + "args": { + "External id": 226332,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236830.304, "dur": 0.400, + "args": { + "External id": 226333,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236834.809, "dur": 1.195, + "args": { + "External id": 226334,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236836.740, "dur": 0.311, + "args": { + "External id": 226335,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236837.975, "dur": 0.300, + "args": { + "External id": 226336,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236842.143, "dur": 0.291, + "args": { + "External id": 226337,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236843.341, "dur": 0.173, + "args": { + "External id": 226338,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115236846.190, "dur": 2.306, + "args": { + "External id": 226339,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115236865.039, "dur": 23.440, + "args": { + "External id": 226340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115236949.585, "dur": 361.798, + "args": { + "External id": 226341,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115236984.331, "dur": 322.465, + "args": { + "External id": 226342,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5141, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115236994.416, "dur": 306.585, + "args": { + "External id": 226343,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115237332.158, "dur": 2.217, + "args": { + "External id": 226344,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5143, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 4183442, "tid": 4183442, + "ts": 667115237418.748, "dur": 7713.086, + "args": { + "External id": 226345,"Record function id": 0, "Ev Idx": 5144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237538.149, "dur": 6.275, + "args": { + "External id": 226346,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237547.987, "dur": 1.206, + "args": { + "External id": 226347,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237551.023, "dur": 2.359, + "args": { + "External id": 226348,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237555.066, "dur": 0.904, + "args": { + "External id": 226349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237557.685, "dur": 0.886, + "args": { + "External id": 226350,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237559.942, "dur": 1.238, + "args": { + "External id": 226351,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237566.238, "dur": 1.056, + "args": { + "External id": 226352,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237568.650, "dur": 2.497, + "args": { + "External id": 226353,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237572.468, "dur": 0.683, + "args": { + "External id": 226354,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115237574.560, "dur": 0.841, + "args": { + "External id": 226355,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115237595.213, "dur": 7498.722, + "args": { + "External id": 226356,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115237612.312, "dur": 7474.871, + "args": { + "External id": 226357,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115237628.255, "dur": 15.148, + "args": { + "External id": 226358,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115237645.844, "dur": 7411.405, + "args": { + "External id": 226359,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115237648.436, "dur": 7408.310, + "args": { + "External id": 226360,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115237690.308, "dur": 5.914, + "args": { + "External id": 226361,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115237698.266, "dur": 7355.649, + "args": { + "External id": 226362,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115245266.535, "dur": 28.904, + "args": { + "External id": 226363,"Sequence number": 2757753, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5162 + } + }, + { + "ph": "s", "id": 203, "pid": 4183442, "tid": 4183442, "ts": 667115245266.535, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115245282.094, "dur": 8.790, + "args": { + "External id": 226364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115245286.616, "dur": 4.046, + "args": { + "External id": 226365,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115245358.341, "dur": 84.624, + "args": { + "External id": 226366,"Record function id": 0, "Ev Idx": 5165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115245444.723, "dur": 1090.229, + "args": { + "External id": 226367,"Record function id": 0, "Ev Idx": 5166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115245484.578, "dur": 1035.882, + "args": { + "External id": 226368,"Sequence number": 2757754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5167 + } + }, + { + "ph": "s", "id": 202, "pid": 4183442, "tid": 4183442, "ts": 667115245484.578, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115245577.604, "dur": 42.475, + "args": { + "External id": 226369,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115245633.071, "dur": 131.695, + "args": { + "External id": 226370,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115245777.915, "dur": 36.591, + "args": { + "External id": 226371,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115245824.107, "dur": 29.214, + "args": { + "External id": 226372,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115245880.978, "dur": 25.917, + "args": { + "External id": 226373,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115245923.669, "dur": 14.871, + "args": { + "External id": 226374,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115245958.613, "dur": 129.287, + "args": { + "External id": 226375,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115246008.193, "dur": 11.381, + "args": { + "External id": 226376,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115246012.630, "dur": 5.925, + "args": { + "External id": 226377,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115246024.279, "dur": 5.690, + "args": { + "External id": 226378,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115246031.310, "dur": 1.083, + "args": { + "External id": 226379,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115246034.781, "dur": 3.602, + "args": { + "External id": 226380,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115246098.496, "dur": 43.084, + "args": { + "External id": 226381,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115246171.359, "dur": 28.090, + "args": { + "External id": 226382,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115246208.651, "dur": 37.874, + "args": { + "External id": 226383,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115246254.485, "dur": 31.264, + "args": { + "External id": 226384,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115246309.156, "dur": 25.107, + "args": { + "External id": 226385,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115246340.966, "dur": 47.108, + "args": { + "External id": 226386,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115246407.197, "dur": 17.135, + "args": { + "External id": 226387,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5186 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.4)", "pid": 4183442, "tid": 4183442, + "ts": 667115246600.193, "dur": 127.442, + "args": { + "External id": 226388,"Record function id": 0, "Ev Idx": 5187 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115246806.272, "dur": 49.797, + "args": { + "External id": 226389,"Record function id": 0, "Ev Idx": 5188 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.5)", "pid": 4183442, "tid": 4183442, + "ts": 667115246865.218, "dur": 9067.421, + "args": { + "External id": 226390,"Record function id": 0, "Ev Idx": 5189 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 4183442, "tid": 4183442, + "ts": 667115246876.792, "dur": 940.055, + "args": { + "External id": 226391,"Record function id": 0, "Ev Idx": 5190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115246962.053, "dur": 9.400, + "args": { + "External id": 226392,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115246984.115, "dur": 42.111, + "args": { + "External id": 226393,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115246991.824, "dur": 2.347, + "args": { + "External id": 226394,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115246998.995, "dur": 0.581, + "args": { + "External id": 226395,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247002.003, "dur": 0.624, + "args": { + "External id": 226396,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247003.388, "dur": 0.372, + "args": { + "External id": 226397,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247006.843, "dur": 0.611, + "args": { + "External id": 226398,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247010.064, "dur": 0.660, + "args": { + "External id": 226399,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247011.421, "dur": 2.837, + "args": { + "External id": 226400,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247014.996, "dur": 0.700, + "args": { + "External id": 226401,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247018.514, "dur": 0.159, + "args": { + "External id": 226402,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115247037.920, "dur": 45.239, + "args": { + "External id": 226403,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115247115.533, "dur": 121.887, + "args": { + "External id": 226404,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115247129.772, "dur": 3.663, + "args": { + "External id": 226405,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115247138.558, "dur": 9.591, + "args": { + "External id": 226406,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115247142.815, "dur": 4.910, + "args": { + "External id": 226407,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247145.755, "dur": 0.696, + "args": { + "External id": 226408,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115247154.454, "dur": 35.234, + "args": { + "External id": 226409,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247157.843, "dur": 2.822, + "args": { + "External id": 226410,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247161.701, "dur": 0.477, + "args": { + "External id": 226411,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247163.038, "dur": 0.535, + "args": { + "External id": 226412,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247169.090, "dur": 2.336, + "args": { + "External id": 226413,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247172.090, "dur": 0.522, + "args": { + "External id": 226414,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247173.299, "dur": 0.439, + "args": { + "External id": 226415,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247178.650, "dur": 0.147, + "args": { + "External id": 226416,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247179.590, "dur": 0.532, + "args": { + "External id": 226417,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115247182.325, "dur": 2.277, + "args": { + "External id": 226418,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115247204.858, "dur": 24.312, + "args": { + "External id": 226419,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115247289.361, "dur": 426.087, + "args": { + "External id": 226420,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115247321.028, "dur": 388.971, + "args": { + "External id": 226421,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5220, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115247330.727, "dur": 373.192, + "args": { + "External id": 226422,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115247740.868, "dur": 3.261, + "args": { + "External id": 226423,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5222, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 4183442, "tid": 4183442, + "ts": 667115247837.659, "dur": 7902.813, + "args": { + "External id": 226424,"Record function id": 0, "Ev Idx": 5223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247937.738, "dur": 6.468, + "args": { + "External id": 226425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247947.434, "dur": 1.413, + "args": { + "External id": 226426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247950.538, "dur": 2.998, + "args": { + "External id": 226427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247955.421, "dur": 1.196, + "args": { + "External id": 226428,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247958.117, "dur": 0.858, + "args": { + "External id": 226429,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247960.944, "dur": 0.840, + "args": { + "External id": 226430,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247965.826, "dur": 1.101, + "args": { + "External id": 226431,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247968.637, "dur": 2.137, + "args": { + "External id": 226432,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247972.184, "dur": 1.125, + "args": { + "External id": 226433,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115247974.693, "dur": 1.015, + "args": { + "External id": 226434,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115247995.031, "dur": 7707.344, + "args": { + "External id": 226435,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115248019.767, "dur": 7675.985, + "args": { + "External id": 226436,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115248034.199, "dur": 14.805, + "args": { + "External id": 226437,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115248051.890, "dur": 7571.823, + "args": { + "External id": 226438,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115248054.405, "dur": 7568.726, + "args": { + "External id": 226439,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115248060.274, "dur": 4.674, + "args": { + "External id": 226440,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115248066.642, "dur": 7553.863, + "args": { + "External id": 226441,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115255878.918, "dur": 28.602, + "args": { + "External id": 226442,"Sequence number": 2757755, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5241 + } + }, + { + "ph": "s", "id": 201, "pid": 4183442, "tid": 4183442, "ts": 667115255878.918, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115255894.430, "dur": 8.577, + "args": { + "External id": 226443,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115255898.420, "dur": 4.327, + "args": { + "External id": 226444,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115255971.910, "dur": 84.989, + "args": { + "External id": 226445,"Record function id": 0, "Ev Idx": 5244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115256058.225, "dur": 1118.772, + "args": { + "External id": 226446,"Record function id": 0, "Ev Idx": 5245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115256097.460, "dur": 1065.207, + "args": { + "External id": 226447,"Sequence number": 2757756, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5246 + } + }, + { + "ph": "s", "id": 200, "pid": 4183442, "tid": 4183442, "ts": 667115256097.460, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115256164.976, "dur": 42.151, + "args": { + "External id": 226448,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256220.228, "dur": 89.583, + "args": { + "External id": 226449,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256320.334, "dur": 34.996, + "args": { + "External id": 226450,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256364.930, "dur": 28.602, + "args": { + "External id": 226451,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115256418.759, "dur": 25.547, + "args": { + "External id": 226452,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115256462.021, "dur": 15.353, + "args": { + "External id": 226453,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115256529.011, "dur": 179.931, + "args": { + "External id": 226454,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115256582.043, "dur": 13.246, + "args": { + "External id": 226455,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115256586.796, "dur": 7.468, + "args": { + "External id": 226456,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115256598.371, "dur": 4.039, + "args": { + "External id": 226457,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115256604.120, "dur": 0.888, + "args": { + "External id": 226458,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115256607.399, "dur": 4.127, + "args": { + "External id": 226459,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256722.237, "dur": 53.901, + "args": { + "External id": 226460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115256813.550, "dur": 31.833, + "args": { + "External id": 226461,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256855.269, "dur": 43.277, + "args": { + "External id": 226462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115256906.995, "dur": 49.130, + "args": { + "External id": 226463,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115256977.953, "dur": 29.806, + "args": { + "External id": 226464,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115257014.138, "dur": 38.940, + "args": { + "External id": 226465,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115257075.664, "dur": 19.335, + "args": { + "External id": 226466,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5265 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.5)", "pid": 4183442, "tid": 4183442, + "ts": 667115257241.125, "dur": 77.213, + "args": { + "External id": 226467,"Record function id": 0, "Ev Idx": 5266 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115257390.545, "dur": 45.947, + "args": { + "External id": 226468,"Record function id": 0, "Ev Idx": 5267 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.6)", "pid": 4183442, "tid": 4183442, + "ts": 667115257445.100, "dur": 8873.786, + "args": { + "External id": 226469,"Record function id": 0, "Ev Idx": 5268 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 4183442, "tid": 4183442, + "ts": 667115257453.062, "dur": 979.705, + "args": { + "External id": 226470,"Record function id": 0, "Ev Idx": 5269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115257558.961, "dur": 8.639, + "args": { + "External id": 226471,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115257583.989, "dur": 39.822, + "args": { + "External id": 226472,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257589.834, "dur": 2.118, + "args": { + "External id": 226473,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257596.828, "dur": 0.610, + "args": { + "External id": 226474,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257598.957, "dur": 0.625, + "args": { + "External id": 226475,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257601.262, "dur": 0.534, + "args": { + "External id": 226476,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257605.285, "dur": 0.376, + "args": { + "External id": 226477,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257607.088, "dur": 0.341, + "args": { + "External id": 226478,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257609.361, "dur": 3.767, + "args": { + "External id": 226479,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257615.049, "dur": 0.360, + "args": { + "External id": 226480,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257616.764, "dur": 0.150, + "args": { + "External id": 226481,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115257635.327, "dur": 84.293, + "args": { + "External id": 226482,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115257758.708, "dur": 123.120, + "args": { + "External id": 226483,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115257772.450, "dur": 5.349, + "args": { + "External id": 226484,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115257782.563, "dur": 11.065, + "args": { + "External id": 226485,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115257787.240, "dur": 5.970, + "args": { + "External id": 226486,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257791.022, "dur": 0.607, + "args": { + "External id": 226487,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115257800.892, "dur": 33.536, + "args": { + "External id": 226488,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257802.936, "dur": 2.823, + "args": { + "External id": 226489,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257807.454, "dur": 0.430, + "args": { + "External id": 226490,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257809.581, "dur": 0.478, + "args": { + "External id": 226491,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257814.272, "dur": 1.174, + "args": { + "External id": 226492,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257817.118, "dur": 0.193, + "args": { + "External id": 226493,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257819.404, "dur": 0.164, + "args": { + "External id": 226494,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257823.383, "dur": 0.236, + "args": { + "External id": 226495,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257825.271, "dur": 0.161, + "args": { + "External id": 226496,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115257827.038, "dur": 2.229, + "args": { + "External id": 226497,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115257849.045, "dur": 25.172, + "args": { + "External id": 226498,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115257936.766, "dur": 403.391, + "args": { + "External id": 226499,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115257971.184, "dur": 363.914, + "args": { + "External id": 226500,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5299, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115257982.051, "dur": 347.510, + "args": { + "External id": 226501,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115258363.820, "dur": 2.394, + "args": { + "External id": 226502,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5301, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 4183442, "tid": 4183442, + "ts": 667115258452.514, "dur": 7669.862, + "args": { + "External id": 226503,"Record function id": 0, "Ev Idx": 5302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258568.196, "dur": 6.279, + "args": { + "External id": 226504,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258578.699, "dur": 1.291, + "args": { + "External id": 226505,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258581.985, "dur": 2.107, + "args": { + "External id": 226506,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258585.920, "dur": 1.039, + "args": { + "External id": 226507,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258588.408, "dur": 1.261, + "args": { + "External id": 226508,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258591.355, "dur": 0.769, + "args": { + "External id": 226509,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258595.761, "dur": 0.801, + "args": { + "External id": 226510,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258598.014, "dur": 1.859, + "args": { + "External id": 226511,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258601.362, "dur": 0.747, + "args": { + "External id": 226512,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115258604.025, "dur": 0.909, + "args": { + "External id": 226513,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115258625.793, "dur": 7450.982, + "args": { + "External id": 226514,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115258641.913, "dur": 7428.096, + "args": { + "External id": 226515,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115258703.315, "dur": 16.854, + "args": { + "External id": 226516,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115258723.018, "dur": 7315.173, + "args": { + "External id": 226517,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115258725.483, "dur": 7312.095, + "args": { + "External id": 226518,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115258732.389, "dur": 6.761, + "args": { + "External id": 226519,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115258740.969, "dur": 7294.089, + "args": { + "External id": 226520,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115266265.013, "dur": 28.207, + "args": { + "External id": 226521,"Sequence number": 2757757, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5320 + } + }, + { + "ph": "s", "id": 199, "pid": 4183442, "tid": 4183442, "ts": 667115266265.013, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115266280.621, "dur": 7.913, + "args": { + "External id": 226522,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115266283.875, "dur": 4.371, + "args": { + "External id": 226523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115266359.232, "dur": 83.155, + "args": { + "External id": 226524,"Record function id": 0, "Ev Idx": 5323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115266444.914, "dur": 1087.162, + "args": { + "External id": 226525,"Record function id": 0, "Ev Idx": 5324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115266486.811, "dur": 1030.638, + "args": { + "External id": 226526,"Sequence number": 2757758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5325 + } + }, + { + "ph": "s", "id": 198, "pid": 4183442, "tid": 4183442, "ts": 667115266486.811, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115266567.314, "dur": 45.295, + "args": { + "External id": 226527,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115266626.313, "dur": 127.052, + "args": { + "External id": 226528,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115266766.936, "dur": 37.553, + "args": { + "External id": 226529,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115266815.376, "dur": 29.185, + "args": { + "External id": 226530,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115266871.771, "dur": 28.132, + "args": { + "External id": 226531,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115266917.481, "dur": 15.575, + "args": { + "External id": 226532,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115266952.682, "dur": 129.243, + "args": { + "External id": 226533,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115267002.555, "dur": 10.867, + "args": { + "External id": 226534,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267007.318, "dur": 5.308, + "args": { + "External id": 226535,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115267016.160, "dur": 6.542, + "args": { + "External id": 226536,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115267023.831, "dur": 1.246, + "args": { + "External id": 226537,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115267027.714, "dur": 3.588, + "args": { + "External id": 226538,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115267092.652, "dur": 41.984, + "args": { + "External id": 226539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115267165.293, "dur": 28.561, + "args": { + "External id": 226540,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115267202.030, "dur": 37.632, + "args": { + "External id": 226541,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115267248.396, "dur": 31.736, + "args": { + "External id": 226542,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115267303.653, "dur": 24.265, + "args": { + "External id": 226543,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115267333.286, "dur": 50.729, + "args": { + "External id": 226544,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115267404.246, "dur": 25.348, + "args": { + "External id": 226545,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5344 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.6)", "pid": 4183442, "tid": 4183442, + "ts": 667115267595.963, "dur": 110.957, + "args": { + "External id": 226546,"Record function id": 0, "Ev Idx": 5345 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115267783.684, "dur": 46.813, + "args": { + "External id": 226547,"Record function id": 0, "Ev Idx": 5346 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.7)", "pid": 4183442, "tid": 4183442, + "ts": 667115267840.985, "dur": 8724.466, + "args": { + "External id": 226548,"Record function id": 0, "Ev Idx": 5347 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 4183442, "tid": 4183442, + "ts": 667115267848.448, "dur": 928.508, + "args": { + "External id": 226549,"Record function id": 0, "Ev Idx": 5348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115267930.427, "dur": 8.620, + "args": { + "External id": 226550,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115267952.288, "dur": 38.718, + "args": { + "External id": 226551,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267957.659, "dur": 2.112, + "args": { + "External id": 226552,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267965.156, "dur": 0.394, + "args": { + "External id": 226553,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267967.471, "dur": 0.277, + "args": { + "External id": 226554,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267969.263, "dur": 0.384, + "args": { + "External id": 226555,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267972.996, "dur": 0.381, + "args": { + "External id": 226556,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267974.863, "dur": 0.356, + "args": { + "External id": 226557,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267976.827, "dur": 4.057, + "args": { + "External id": 226558,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267982.329, "dur": 0.194, + "args": { + "External id": 226559,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115267983.793, "dur": 0.153, + "args": { + "External id": 226560,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115268002.422, "dur": 42.853, + "args": { + "External id": 226561,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115268080.364, "dur": 117.886, + "args": { + "External id": 226562,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115268092.815, "dur": 3.797, + "args": { + "External id": 226563,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115268101.559, "dur": 10.269, + "args": { + "External id": 226564,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115268106.136, "dur": 5.294, + "args": { + "External id": 226565,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268109.750, "dur": 0.466, + "args": { + "External id": 226566,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115268118.716, "dur": 33.440, + "args": { + "External id": 226567,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268121.064, "dur": 2.720, + "args": { + "External id": 226568,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268125.640, "dur": 0.390, + "args": { + "External id": 226569,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268127.755, "dur": 0.445, + "args": { + "External id": 226570,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268132.093, "dur": 1.419, + "args": { + "External id": 226571,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268135.022, "dur": 0.655, + "args": { + "External id": 226572,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268136.995, "dur": 0.365, + "args": { + "External id": 226573,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268140.668, "dur": 0.156, + "args": { + "External id": 226574,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268142.485, "dur": 0.306, + "args": { + "External id": 226575,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115268144.488, "dur": 2.303, + "args": { + "External id": 226576,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115268167.673, "dur": 22.982, + "args": { + "External id": 226577,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115268251.219, "dur": 386.668, + "args": { + "External id": 226578,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115268286.128, "dur": 346.504, + "args": { + "External id": 226579,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5378, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115268296.198, "dur": 330.974, + "args": { + "External id": 226580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115268696.315, "dur": 3.876, + "args": { + "External id": 226581,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5380, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 4183442, "tid": 4183442, + "ts": 667115268798.682, "dur": 7553.904, + "args": { + "External id": 226582,"Record function id": 0, "Ev Idx": 5381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268912.045, "dur": 6.760, + "args": { + "External id": 226583,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268922.679, "dur": 1.180, + "args": { + "External id": 226584,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268926.074, "dur": 2.494, + "args": { + "External id": 226585,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268932.331, "dur": 1.248, + "args": { + "External id": 226586,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268935.155, "dur": 0.899, + "args": { + "External id": 226587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268937.719, "dur": 1.138, + "args": { + "External id": 226588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268940.531, "dur": 0.981, + "args": { + "External id": 226589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268945.183, "dur": 2.862, + "args": { + "External id": 226590,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268949.864, "dur": 0.776, + "args": { + "External id": 226591,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115268952.359, "dur": 0.841, + "args": { + "External id": 226592,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115268972.759, "dur": 7337.856, + "args": { + "External id": 226593,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115268988.212, "dur": 7315.739, + "args": { + "External id": 226594,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115269002.801, "dur": 15.984, + "args": { + "External id": 226595,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115269024.067, "dur": 7249.705, + "args": { + "External id": 226596,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115269026.515, "dur": 7246.726, + "args": { + "External id": 226597,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115269032.376, "dur": 6.172, + "args": { + "External id": 226598,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115269040.233, "dur": 7229.944, + "args": { + "External id": 226599,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115276506.133, "dur": 32.656, + "args": { + "External id": 226600,"Sequence number": 2757759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5399 + } + }, + { + "ph": "s", "id": 197, "pid": 4183442, "tid": 4183442, "ts": 667115276506.133, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115276525.951, "dur": 7.967, + "args": { + "External id": 226601,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115276529.327, "dur": 4.249, + "args": { + "External id": 226602,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115276606.847, "dur": 116.557, + "args": { + "External id": 226603,"Record function id": 0, "Ev Idx": 5402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115276726.555, "dur": 1087.432, + "args": { + "External id": 226604,"Record function id": 0, "Ev Idx": 5403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115276770.862, "dur": 1028.977, + "args": { + "External id": 226605,"Sequence number": 2757760, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5404 + } + }, + { + "ph": "s", "id": 196, "pid": 4183442, "tid": 4183442, "ts": 667115276770.862, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115276840.141, "dur": 43.267, + "args": { + "External id": 226606,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115276896.644, "dur": 90.378, + "args": { + "External id": 226607,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115276996.695, "dur": 35.571, + "args": { + "External id": 226608,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115277041.853, "dur": 29.795, + "args": { + "External id": 226609,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115277095.134, "dur": 25.932, + "args": { + "External id": 226610,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115277139.896, "dur": 16.935, + "args": { + "External id": 226611,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115277176.895, "dur": 138.525, + "args": { + "External id": 226612,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115277228.072, "dur": 11.368, + "args": { + "External id": 226613,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115277233.744, "dur": 4.907, + "args": { + "External id": 226614,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115277242.058, "dur": 6.519, + "args": { + "External id": 226615,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115277256.682, "dur": 0.862, + "args": { + "External id": 226616,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115277259.911, "dur": 3.085, + "args": { + "External id": 226617,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115277326.640, "dur": 42.568, + "args": { + "External id": 226618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115277400.540, "dur": 29.977, + "args": { + "External id": 226619,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115277439.077, "dur": 37.451, + "args": { + "External id": 226620,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115277484.347, "dur": 51.858, + "args": { + "External id": 226621,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115277561.839, "dur": 29.235, + "args": { + "External id": 226622,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115277597.649, "dur": 44.786, + "args": { + "External id": 226623,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115277701.534, "dur": 24.098, + "args": { + "External id": 226624,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5423 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.7)", "pid": 4183442, "tid": 4183442, + "ts": 667115277880.169, "dur": 77.998, + "args": { + "External id": 226625,"Record function id": 0, "Ev Idx": 5424 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115278029.486, "dur": 46.971, + "args": { + "External id": 226626,"Record function id": 0, "Ev Idx": 5425 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.8)", "pid": 4183442, "tid": 4183442, + "ts": 667115278085.689, "dur": 8804.066, + "args": { + "External id": 226627,"Record function id": 0, "Ev Idx": 5426 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 4183442, "tid": 4183442, + "ts": 667115278094.183, "dur": 917.013, + "args": { + "External id": 226628,"Record function id": 0, "Ev Idx": 5427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115278175.859, "dur": 8.339, + "args": { + "External id": 226629,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115278197.122, "dur": 40.157, + "args": { + "External id": 226630,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278202.592, "dur": 2.173, + "args": { + "External id": 226631,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278209.868, "dur": 0.217, + "args": { + "External id": 226632,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278211.981, "dur": 0.418, + "args": { + "External id": 226633,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278214.109, "dur": 0.483, + "args": { + "External id": 226634,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278218.076, "dur": 0.365, + "args": { + "External id": 226635,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278220.128, "dur": 0.595, + "args": { + "External id": 226636,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278222.002, "dur": 4.086, + "args": { + "External id": 226637,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278227.629, "dur": 0.368, + "args": { + "External id": 226638,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278229.339, "dur": 0.230, + "args": { + "External id": 226639,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115278248.523, "dur": 37.984, + "args": { + "External id": 226640,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115278318.202, "dur": 116.256, + "args": { + "External id": 226641,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115278330.357, "dur": 3.694, + "args": { + "External id": 226642,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115278338.765, "dur": 10.599, + "args": { + "External id": 226643,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115278343.034, "dur": 5.882, + "args": { + "External id": 226644,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278346.981, "dur": 0.548, + "args": { + "External id": 226645,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115278355.950, "dur": 34.011, + "args": { + "External id": 226646,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278357.989, "dur": 2.762, + "args": { + "External id": 226647,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278362.468, "dur": 0.337, + "args": { + "External id": 226648,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278364.278, "dur": 0.588, + "args": { + "External id": 226649,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278368.954, "dur": 1.836, + "args": { + "External id": 226650,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278372.270, "dur": 0.352, + "args": { + "External id": 226651,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278374.227, "dur": 0.544, + "args": { + "External id": 226652,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278378.347, "dur": 0.189, + "args": { + "External id": 226653,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278380.414, "dur": 0.304, + "args": { + "External id": 226654,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115278382.452, "dur": 2.339, + "args": { + "External id": 226655,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115278403.329, "dur": 22.817, + "args": { + "External id": 226656,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115278486.176, "dur": 425.540, + "args": { + "External id": 226657,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115278538.793, "dur": 367.378, + "args": { + "External id": 226658,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5457, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115278549.810, "dur": 347.729, + "args": { + "External id": 226659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115278935.585, "dur": 2.431, + "args": { + "External id": 226660,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5459, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 4183442, "tid": 4183442, + "ts": 667115279033.347, "dur": 7662.285, + "args": { + "External id": 226661,"Record function id": 0, "Ev Idx": 5460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279135.668, "dur": 6.542, + "args": { + "External id": 226662,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279146.144, "dur": 1.051, + "args": { + "External id": 226663,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279149.212, "dur": 2.298, + "args": { + "External id": 226664,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279153.462, "dur": 1.037, + "args": { + "External id": 226665,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279156.144, "dur": 1.134, + "args": { + "External id": 226666,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279158.772, "dur": 0.825, + "args": { + "External id": 226667,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279163.051, "dur": 0.935, + "args": { + "External id": 226668,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279165.768, "dur": 2.063, + "args": { + "External id": 226669,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279169.359, "dur": 1.030, + "args": { + "External id": 226670,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115279171.825, "dur": 0.733, + "args": { + "External id": 226671,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115279202.880, "dur": 7425.186, + "args": { + "External id": 226672,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115279219.551, "dur": 7401.866, + "args": { + "External id": 226673,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115279233.873, "dur": 15.161, + "args": { + "External id": 226674,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115279251.377, "dur": 7338.542, + "args": { + "External id": 226675,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115279254.073, "dur": 7335.293, + "args": { + "External id": 226676,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115279260.667, "dur": 6.392, + "args": { + "External id": 226677,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115279268.651, "dur": 7317.896, + "args": { + "External id": 226678,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115286838.300, "dur": 27.721, + "args": { + "External id": 226679,"Sequence number": 2757761, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5478 + } + }, + { + "ph": "s", "id": 195, "pid": 4183442, "tid": 4183442, "ts": 667115286838.300, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115286853.601, "dur": 7.708, + "args": { + "External id": 226680,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115286856.462, "dur": 4.615, + "args": { + "External id": 226681,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115286928.295, "dur": 86.449, + "args": { + "External id": 226682,"Record function id": 0, "Ev Idx": 5481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115287016.719, "dur": 1101.819, + "args": { + "External id": 226683,"Record function id": 0, "Ev Idx": 5482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115287057.288, "dur": 1047.450, + "args": { + "External id": 226684,"Sequence number": 2757762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5483 + } + }, + { + "ph": "s", "id": 194, "pid": 4183442, "tid": 4183442, "ts": 667115287057.288, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115287123.903, "dur": 40.601, + "args": { + "External id": 226685,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287177.333, "dur": 88.738, + "args": { + "External id": 226686,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287275.751, "dur": 34.504, + "args": { + "External id": 226687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287320.093, "dur": 29.807, + "args": { + "External id": 226688,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115287374.999, "dur": 25.364, + "args": { + "External id": 226689,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115287417.701, "dur": 13.948, + "args": { + "External id": 226690,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115287449.314, "dur": 149.257, + "args": { + "External id": 226691,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115287515.854, "dur": 11.737, + "args": { + "External id": 226692,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115287520.283, "dur": 6.233, + "args": { + "External id": 226693,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115287530.423, "dur": 6.284, + "args": { + "External id": 226694,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115287538.036, "dur": 1.162, + "args": { + "External id": 226695,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115287541.590, "dur": 3.457, + "args": { + "External id": 226696,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287609.862, "dur": 85.276, + "args": { + "External id": 226697,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115287732.412, "dur": 33.807, + "args": { + "External id": 226698,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287774.880, "dur": 42.744, + "args": { + "External id": 226699,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287825.843, "dur": 47.219, + "args": { + "External id": 226700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115287897.749, "dur": 32.648, + "args": { + "External id": 226701,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115287936.044, "dur": 56.873, + "args": { + "External id": 226702,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115288013.104, "dur": 18.459, + "args": { + "External id": 226703,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5502 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.8)", "pid": 4183442, "tid": 4183442, + "ts": 667115288181.145, "dur": 78.371, + "args": { + "External id": 226704,"Record function id": 0, "Ev Idx": 5503 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115288334.610, "dur": 47.976, + "args": { + "External id": 226705,"Record function id": 0, "Ev Idx": 5504 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.9)", "pid": 4183442, "tid": 4183442, + "ts": 667115288392.118, "dur": 9012.853, + "args": { + "External id": 226706,"Record function id": 0, "Ev Idx": 5505 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 4183442, "tid": 4183442, + "ts": 667115288402.756, "dur": 945.510, + "args": { + "External id": 226707,"Record function id": 0, "Ev Idx": 5506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115288483.733, "dur": 24.204, + "args": { + "External id": 226708,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115288523.752, "dur": 38.747, + "args": { + "External id": 226709,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288529.163, "dur": 2.335, + "args": { + "External id": 226710,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288536.067, "dur": 0.431, + "args": { + "External id": 226711,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288537.941, "dur": 0.596, + "args": { + "External id": 226712,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288540.080, "dur": 0.330, + "args": { + "External id": 226713,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288543.764, "dur": 0.508, + "args": { + "External id": 226714,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288545.758, "dur": 0.270, + "args": { + "External id": 226715,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288547.101, "dur": 3.777, + "args": { + "External id": 226716,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288552.701, "dur": 0.316, + "args": { + "External id": 226717,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288554.710, "dur": 0.262, + "args": { + "External id": 226718,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115288574.919, "dur": 43.499, + "args": { + "External id": 226719,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115288701.700, "dur": 148.238, + "args": { + "External id": 226720,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115288717.489, "dur": 6.040, + "args": { + "External id": 226721,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115288728.742, "dur": 12.098, + "args": { + "External id": 226722,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115288732.936, "dur": 7.499, + "args": { + "External id": 226723,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288737.848, "dur": 0.925, + "args": { + "External id": 226724,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115288748.730, "dur": 39.033, + "args": { + "External id": 226725,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288751.251, "dur": 2.588, + "args": { + "External id": 226726,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288761.861, "dur": 0.313, + "args": { + "External id": 226727,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288763.778, "dur": 0.245, + "args": { + "External id": 226728,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288767.500, "dur": 1.487, + "args": { + "External id": 226729,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288770.322, "dur": 0.299, + "args": { + "External id": 226730,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288772.043, "dur": 2.524, + "args": { + "External id": 226731,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288776.240, "dur": 0.350, + "args": { + "External id": 226732,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288778.273, "dur": 0.244, + "args": { + "External id": 226733,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115288782.153, "dur": 0.202, + "args": { + "External id": 226734,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115288812.465, "dur": 28.667, + "args": { + "External id": 226735,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115288906.256, "dur": 355.201, + "args": { + "External id": 226736,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115288936.386, "dur": 320.676, + "args": { + "External id": 226737,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5536, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115288948.412, "dur": 303.485, + "args": { + "External id": 226738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115289282.522, "dur": 2.388, + "args": { + "External id": 226739,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5538, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 4183442, "tid": 4183442, + "ts": 667115289368.336, "dur": 7843.366, + "args": { + "External id": 226740,"Record function id": 0, "Ev Idx": 5539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289460.417, "dur": 5.285, + "args": { + "External id": 226741,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289469.504, "dur": 1.344, + "args": { + "External id": 226742,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289472.735, "dur": 2.060, + "args": { + "External id": 226743,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289476.504, "dur": 1.161, + "args": { + "External id": 226744,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289479.289, "dur": 1.032, + "args": { + "External id": 226745,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289483.856, "dur": 1.224, + "args": { + "External id": 226746,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289486.873, "dur": 0.873, + "args": { + "External id": 226747,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289489.451, "dur": 22.020, + "args": { + "External id": 226748,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289515.726, "dur": 1.328, + "args": { + "External id": 226749,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115289520.501, "dur": 0.945, + "args": { + "External id": 226750,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115289540.164, "dur": 7626.162, + "args": { + "External id": 226751,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115289555.571, "dur": 7604.311, + "args": { + "External id": 226752,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115289571.157, "dur": 15.749, + "args": { + "External id": 226753,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115289589.530, "dur": 7539.911, + "args": { + "External id": 226754,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115289592.141, "dur": 7536.685, + "args": { + "External id": 226755,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115289598.163, "dur": 7.051, + "args": { + "External id": 226756,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115289606.847, "dur": 7519.031, + "args": { + "External id": 226757,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115297349.326, "dur": 28.290, + "args": { + "External id": 226758,"Sequence number": 2757763, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5557 + } + }, + { + "ph": "s", "id": 193, "pid": 4183442, "tid": 4183442, "ts": 667115297349.326, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115297365.091, "dur": 8.051, + "args": { + "External id": 226759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115297368.454, "dur": 4.480, + "args": { + "External id": 226760,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115297444.156, "dur": 100.084, + "args": { + "External id": 226761,"Record function id": 0, "Ev Idx": 5560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115297547.885, "dur": 1048.573, + "args": { + "External id": 226762,"Record function id": 0, "Ev Idx": 5561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115297590.776, "dur": 992.144, + "args": { + "External id": 226763,"Sequence number": 2757764, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5562 + } + }, + { + "ph": "s", "id": 192, "pid": 4183442, "tid": 4183442, "ts": 667115297590.776, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115297690.283, "dur": 43.550, + "args": { + "External id": 226764,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115297749.543, "dur": 92.028, + "args": { + "External id": 226765,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115297850.741, "dur": 34.617, + "args": { + "External id": 226766,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115297893.223, "dur": 29.335, + "args": { + "External id": 226767,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115297948.838, "dur": 25.319, + "args": { + "External id": 226768,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115297990.654, "dur": 13.570, + "args": { + "External id": 226769,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115298023.454, "dur": 132.773, + "args": { + "External id": 226770,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115298075.490, "dur": 11.695, + "args": { + "External id": 226771,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115298080.580, "dur": 5.841, + "args": { + "External id": 226772,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115298090.026, "dur": 5.890, + "args": { + "External id": 226773,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115298097.233, "dur": 1.650, + "args": { + "External id": 226774,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115298101.070, "dur": 4.198, + "args": { + "External id": 226775,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115298167.200, "dur": 42.442, + "args": { + "External id": 226776,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115298240.640, "dur": 26.577, + "args": { + "External id": 226777,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115298282.551, "dur": 37.615, + "args": { + "External id": 226778,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115298329.612, "dur": 30.953, + "args": { + "External id": 226779,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115298383.461, "dur": 26.036, + "args": { + "External id": 226780,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115298414.688, "dur": 46.112, + "args": { + "External id": 226781,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115298480.039, "dur": 33.781, + "args": { + "External id": 226782,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5581 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.9)", "pid": 4183442, "tid": 4183442, + "ts": 667115298697.428, "dur": 83.289, + "args": { + "External id": 226783,"Record function id": 0, "Ev Idx": 5582 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115298857.374, "dur": 49.912, + "args": { + "External id": 226784,"Record function id": 0, "Ev Idx": 5583 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.10)", "pid": 4183442, "tid": 4183442, + "ts": 667115298917.252, "dur": 9102.275, + "args": { + "External id": 226785,"Record function id": 0, "Ev Idx": 5584 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 4183442, "tid": 4183442, + "ts": 667115298927.093, "dur": 927.742, + "args": { + "External id": 226786,"Record function id": 0, "Ev Idx": 5585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115299011.051, "dur": 9.220, + "args": { + "External id": 226787,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115299033.552, "dur": 37.768, + "args": { + "External id": 226788,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299038.311, "dur": 2.331, + "args": { + "External id": 226789,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299045.372, "dur": 0.233, + "args": { + "External id": 226790,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299046.748, "dur": 0.377, + "args": { + "External id": 226791,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299048.164, "dur": 0.425, + "args": { + "External id": 226792,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299051.598, "dur": 0.444, + "args": { + "External id": 226793,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299053.255, "dur": 0.497, + "args": { + "External id": 226794,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299054.884, "dur": 4.314, + "args": { + "External id": 226795,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299060.431, "dur": 0.368, + "args": { + "External id": 226796,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299062.375, "dur": 0.158, + "args": { + "External id": 226797,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115299083.264, "dur": 41.351, + "args": { + "External id": 226798,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115299158.355, "dur": 109.135, + "args": { + "External id": 226799,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115299168.190, "dur": 4.096, + "args": { + "External id": 226800,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115299177.240, "dur": 9.734, + "args": { + "External id": 226801,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115299181.610, "dur": 4.979, + "args": { + "External id": 226802,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299184.694, "dur": 0.603, + "args": { + "External id": 226803,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115299193.070, "dur": 30.161, + "args": { + "External id": 226804,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299194.719, "dur": 2.860, + "args": { + "External id": 226805,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299199.185, "dur": 0.389, + "args": { + "External id": 226806,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299200.765, "dur": 0.333, + "args": { + "External id": 226807,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299204.522, "dur": 1.383, + "args": { + "External id": 226808,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299207.278, "dur": 0.315, + "args": { + "External id": 226809,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299208.894, "dur": 0.344, + "args": { + "External id": 226810,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299211.595, "dur": 0.251, + "args": { + "External id": 226811,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299213.194, "dur": 0.282, + "args": { + "External id": 226812,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115299214.610, "dur": 2.109, + "args": { + "External id": 226813,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115299234.898, "dur": 23.591, + "args": { + "External id": 226814,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115299320.645, "dur": 430.638, + "args": { + "External id": 226815,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115299352.169, "dur": 393.051, + "args": { + "External id": 226816,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5615, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115299386.763, "dur": 352.104, + "args": { + "External id": 226817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115299774.985, "dur": 2.505, + "args": { + "External id": 226818,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5617, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 4183442, "tid": 4183442, + "ts": 667115299876.924, "dur": 7952.336, + "args": { + "External id": 226819,"Record function id": 0, "Ev Idx": 5618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299976.218, "dur": 6.624, + "args": { + "External id": 226820,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299986.005, "dur": 1.169, + "args": { + "External id": 226821,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299989.555, "dur": 2.285, + "args": { + "External id": 226822,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299993.549, "dur": 1.287, + "args": { + "External id": 226823,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299996.383, "dur": 1.518, + "args": { + "External id": 226824,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115299999.458, "dur": 0.943, + "args": { + "External id": 226825,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115300003.728, "dur": 0.947, + "args": { + "External id": 226826,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115300006.182, "dur": 3.827, + "args": { + "External id": 226827,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115300011.748, "dur": 0.879, + "args": { + "External id": 226828,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115300014.083, "dur": 0.783, + "args": { + "External id": 226829,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115300034.907, "dur": 7751.291, + "args": { + "External id": 226830,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115300051.092, "dur": 7728.595, + "args": { + "External id": 226831,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115300065.329, "dur": 15.124, + "args": { + "External id": 226832,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115300082.764, "dur": 7666.075, + "args": { + "External id": 226833,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115300085.203, "dur": 7663.068, + "args": { + "External id": 226834,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115300090.836, "dur": 6.868, + "args": { + "External id": 226835,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115300099.395, "dur": 7646.356, + "args": { + "External id": 226836,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115307967.007, "dur": 27.950, + "args": { + "External id": 226837,"Sequence number": 2757765, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5636 + } + }, + { + "ph": "s", "id": 191, "pid": 4183442, "tid": 4183442, "ts": 667115307967.007, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115307983.625, "dur": 6.870, + "args": { + "External id": 226838,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115307986.435, "dur": 3.875, + "args": { + "External id": 226839,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115308058.879, "dur": 85.350, + "args": { + "External id": 226840,"Record function id": 0, "Ev Idx": 5639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115308145.972, "dur": 1092.990, + "args": { + "External id": 226841,"Record function id": 0, "Ev Idx": 5640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115308184.736, "dur": 1040.752, + "args": { + "External id": 226842,"Sequence number": 2757766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5641 + } + }, + { + "ph": "s", "id": 190, "pid": 4183442, "tid": 4183442, "ts": 667115308184.736, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115308244.891, "dur": 42.683, + "args": { + "External id": 226843,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308300.799, "dur": 91.279, + "args": { + "External id": 226844,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308401.709, "dur": 34.881, + "args": { + "External id": 226845,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308444.871, "dur": 29.476, + "args": { + "External id": 226846,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115308516.132, "dur": 29.672, + "args": { + "External id": 226847,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115308564.259, "dur": 15.621, + "args": { + "External id": 226848,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115308598.638, "dur": 173.442, + "args": { + "External id": 226849,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115308684.740, "dur": 14.098, + "args": { + "External id": 226850,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115308690.544, "dur": 7.204, + "args": { + "External id": 226851,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115308701.525, "dur": 6.000, + "args": { + "External id": 226852,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115308708.912, "dur": 1.417, + "args": { + "External id": 226853,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115308712.828, "dur": 4.231, + "args": { + "External id": 226854,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308783.315, "dur": 53.957, + "args": { + "External id": 226855,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115308868.432, "dur": 29.429, + "args": { + "External id": 226856,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308907.136, "dur": 38.471, + "args": { + "External id": 226857,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115308954.889, "dur": 50.458, + "args": { + "External id": 226858,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115309027.364, "dur": 27.826, + "args": { + "External id": 226859,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115309061.025, "dur": 54.102, + "args": { + "External id": 226860,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115309135.615, "dur": 18.698, + "args": { + "External id": 226861,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5660 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.10)", "pid": 4183442, "tid": 4183442, + "ts": 667115309300.262, "dur": 72.959, + "args": { + "External id": 226862,"Record function id": 0, "Ev Idx": 5661 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115309444.079, "dur": 63.151, + "args": { + "External id": 226863,"Record function id": 0, "Ev Idx": 5662 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.11)", "pid": 4183442, "tid": 4183442, + "ts": 667115309519.562, "dur": 8686.899, + "args": { + "External id": 226864,"Record function id": 0, "Ev Idx": 5663 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 4183442, "tid": 4183442, + "ts": 667115309528.286, "dur": 928.048, + "args": { + "External id": 226865,"Record function id": 0, "Ev Idx": 5664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115309609.530, "dur": 8.598, + "args": { + "External id": 226866,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115309630.897, "dur": 75.418, + "args": { + "External id": 226867,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309635.526, "dur": 2.139, + "args": { + "External id": 226868,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309642.056, "dur": 0.249, + "args": { + "External id": 226869,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309643.431, "dur": 0.283, + "args": { + "External id": 226870,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309644.609, "dur": 0.565, + "args": { + "External id": 226871,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309648.606, "dur": 0.339, + "args": { + "External id": 226872,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309650.482, "dur": 0.227, + "args": { + "External id": 226873,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309688.694, "dur": 4.373, + "args": { + "External id": 226874,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309695.093, "dur": 0.357, + "args": { + "External id": 226875,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309696.977, "dur": 0.411, + "args": { + "External id": 226876,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115309722.007, "dur": 42.673, + "args": { + "External id": 226877,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115309800.553, "dur": 118.877, + "args": { + "External id": 226878,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115309811.570, "dur": 6.960, + "args": { + "External id": 226879,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115309823.770, "dur": 10.810, + "args": { + "External id": 226880,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115309828.197, "dur": 5.947, + "args": { + "External id": 226881,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309831.941, "dur": 0.705, + "args": { + "External id": 226882,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115309841.273, "dur": 31.629, + "args": { + "External id": 226883,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309843.779, "dur": 0.388, + "args": { + "External id": 226884,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309845.879, "dur": 2.466, + "args": { + "External id": 226885,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309849.924, "dur": 0.487, + "args": { + "External id": 226886,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309851.992, "dur": 1.657, + "args": { + "External id": 226887,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309857.829, "dur": 0.397, + "args": { + "External id": 226888,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309859.501, "dur": 0.316, + "args": { + "External id": 226889,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309861.276, "dur": 0.460, + "args": { + "External id": 226890,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309864.993, "dur": 0.277, + "args": { + "External id": 226891,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115309866.595, "dur": 0.290, + "args": { + "External id": 226892,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115309886.047, "dur": 24.772, + "args": { + "External id": 226893,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115309974.631, "dur": 391.411, + "args": { + "External id": 226894,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115310003.004, "dur": 358.357, + "args": { + "External id": 226895,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5694, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115310013.194, "dur": 343.148, + "args": { + "External id": 226896,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115310385.980, "dur": 2.317, + "args": { + "External id": 226897,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5696, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 4183442, "tid": 4183442, + "ts": 667115310478.444, "dur": 7534.840, + "args": { + "External id": 226898,"Record function id": 0, "Ev Idx": 5697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310601.721, "dur": 6.978, + "args": { + "External id": 226899,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310611.941, "dur": 1.117, + "args": { + "External id": 226900,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310614.635, "dur": 2.172, + "args": { + "External id": 226901,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310618.350, "dur": 1.145, + "args": { + "External id": 226902,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310621.325, "dur": 1.017, + "args": { + "External id": 226903,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310623.852, "dur": 0.936, + "args": { + "External id": 226904,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310626.725, "dur": 1.031, + "args": { + "External id": 226905,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310629.928, "dur": 3.340, + "args": { + "External id": 226906,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310634.987, "dur": 0.866, + "args": { + "External id": 226907,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115310637.678, "dur": 0.781, + "args": { + "External id": 226908,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115310691.743, "dur": 7282.967, + "args": { + "External id": 226909,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115310708.893, "dur": 7258.943, + "args": { + "External id": 226910,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115310724.227, "dur": 15.773, + "args": { + "External id": 226911,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115310742.820, "dur": 7194.254, + "args": { + "External id": 226912,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115310745.673, "dur": 7190.954, + "args": { + "External id": 226913,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115310752.091, "dur": 5.867, + "args": { + "External id": 226914,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115310759.444, "dur": 7174.648, + "args": { + "External id": 226915,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115318148.038, "dur": 34.126, + "args": { + "External id": 226916,"Sequence number": 2757767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5715 + } + }, + { + "ph": "s", "id": 189, "pid": 4183442, "tid": 4183442, "ts": 667115318148.038, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115318170.615, "dur": 7.133, + "args": { + "External id": 226917,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115318173.441, "dur": 4.094, + "args": { + "External id": 226918,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115318245.863, "dur": 86.964, + "args": { + "External id": 226919,"Record function id": 0, "Ev Idx": 5718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115318334.491, "dur": 1080.504, + "args": { + "External id": 226920,"Record function id": 0, "Ev Idx": 5719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115318373.199, "dur": 1028.392, + "args": { + "External id": 226921,"Sequence number": 2757768, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5720 + } + }, + { + "ph": "s", "id": 188, "pid": 4183442, "tid": 4183442, "ts": 667115318373.199, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115318438.827, "dur": 38.802, + "args": { + "External id": 226922,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115318503.648, "dur": 94.905, + "args": { + "External id": 226923,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115318611.241, "dur": 35.352, + "args": { + "External id": 226924,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115318692.101, "dur": 36.308, + "args": { + "External id": 226925,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115318756.508, "dur": 27.159, + "args": { + "External id": 226926,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115318801.330, "dur": 19.953, + "args": { + "External id": 226927,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115318840.324, "dur": 131.260, + "args": { + "External id": 226928,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115318892.507, "dur": 11.223, + "args": { + "External id": 226929,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115318897.408, "dur": 5.566, + "args": { + "External id": 226930,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115318906.403, "dur": 6.054, + "args": { + "External id": 226931,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115318913.714, "dur": 1.286, + "args": { + "External id": 226932,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115318917.451, "dur": 4.527, + "args": { + "External id": 226933,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115318982.378, "dur": 48.572, + "args": { + "External id": 226934,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115319060.621, "dur": 31.033, + "args": { + "External id": 226935,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115319100.849, "dur": 39.427, + "args": { + "External id": 226936,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115319149.989, "dur": 36.231, + "args": { + "External id": 226937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115319206.914, "dur": 28.048, + "args": { + "External id": 226938,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115319240.562, "dur": 53.787, + "args": { + "External id": 226939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115319314.962, "dur": 16.076, + "args": { + "External id": 226940,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5739 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.11)", "pid": 4183442, "tid": 4183442, + "ts": 667115319478.276, "dur": 102.626, + "args": { + "External id": 226941,"Record function id": 0, "Ev Idx": 5740 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115319697.493, "dur": 52.121, + "args": { + "External id": 226942,"Record function id": 0, "Ev Idx": 5741 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.12)", "pid": 4183442, "tid": 4183442, + "ts": 667115319759.926, "dur": 8863.775, + "args": { + "External id": 226943,"Record function id": 0, "Ev Idx": 5742 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 4183442, "tid": 4183442, + "ts": 667115319769.300, "dur": 872.640, + "args": { + "External id": 226944,"Record function id": 0, "Ev Idx": 5743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115319854.705, "dur": 9.593, + "args": { + "External id": 226945,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115319880.254, "dur": 40.115, + "args": { + "External id": 226946,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319885.931, "dur": 2.118, + "args": { + "External id": 226947,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319892.942, "dur": 0.347, + "args": { + "External id": 226948,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319894.972, "dur": 0.349, + "args": { + "External id": 226949,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319896.855, "dur": 2.606, + "args": { + "External id": 226950,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319901.117, "dur": 0.437, + "args": { + "External id": 226951,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319903.081, "dur": 0.298, + "args": { + "External id": 226952,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319907.207, "dur": 1.614, + "args": { + "External id": 226953,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319910.616, "dur": 0.397, + "args": { + "External id": 226954,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115319912.484, "dur": 0.252, + "args": { + "External id": 226955,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115319931.923, "dur": 43.813, + "args": { + "External id": 226956,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115320007.300, "dur": 112.420, + "args": { + "External id": 226957,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115320017.770, "dur": 3.940, + "args": { + "External id": 226958,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115320026.757, "dur": 12.611, + "args": { + "External id": 226959,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115320031.269, "dur": 7.699, + "args": { + "External id": 226960,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320034.771, "dur": 2.938, + "args": { + "External id": 226961,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115320046.273, "dur": 30.979, + "args": { + "External id": 226962,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320048.966, "dur": 0.462, + "args": { + "External id": 226963,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320051.392, "dur": 0.403, + "args": { + "External id": 226964,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320053.427, "dur": 0.513, + "args": { + "External id": 226965,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320057.469, "dur": 1.431, + "args": { + "External id": 226966,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320060.400, "dur": 0.494, + "args": { + "External id": 226967,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320062.247, "dur": 2.222, + "args": { + "External id": 226968,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320065.898, "dur": 0.185, + "args": { + "External id": 226969,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320067.664, "dur": 0.196, + "args": { + "External id": 226970,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320071.840, "dur": 0.303, + "args": { + "External id": 226971,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115320089.237, "dur": 23.100, + "args": { + "External id": 226972,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115320172.920, "dur": 374.978, + "args": { + "External id": 226973,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115320199.673, "dur": 343.301, + "args": { + "External id": 226974,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5773, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115320209.656, "dur": 327.912, + "args": { + "External id": 226975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115320570.027, "dur": 2.440, + "args": { + "External id": 226976,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5775, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 4183442, "tid": 4183442, + "ts": 667115320702.425, "dur": 7708.346, + "args": { + "External id": 226977,"Record function id": 0, "Ev Idx": 5776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320812.133, "dur": 6.333, + "args": { + "External id": 226978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320822.192, "dur": 1.213, + "args": { + "External id": 226979,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320825.172, "dur": 2.338, + "args": { + "External id": 226980,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320828.910, "dur": 0.914, + "args": { + "External id": 226981,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320831.335, "dur": 1.069, + "args": { + "External id": 226982,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320834.784, "dur": 1.061, + "args": { + "External id": 226983,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320837.628, "dur": 1.035, + "args": { + "External id": 226984,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320840.631, "dur": 2.087, + "args": { + "External id": 226985,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320844.448, "dur": 0.720, + "args": { + "External id": 226986,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115320847.218, "dur": 0.740, + "args": { + "External id": 226987,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115320865.765, "dur": 7508.116, + "args": { + "External id": 226988,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115320881.477, "dur": 7485.975, + "args": { + "External id": 226989,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115320899.903, "dur": 15.794, + "args": { + "External id": 226990,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115320918.541, "dur": 7418.339, + "args": { + "External id": 226991,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115320921.061, "dur": 7415.298, + "args": { + "External id": 226992,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115320928.087, "dur": 6.854, + "args": { + "External id": 226993,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115320936.830, "dur": 7396.624, + "args": { + "External id": 226994,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115328562.456, "dur": 34.070, + "args": { + "External id": 226995,"Sequence number": 2757769, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5794 + } + }, + { + "ph": "s", "id": 187, "pid": 4183442, "tid": 4183442, "ts": 667115328562.456, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115328584.611, "dur": 7.205, + "args": { + "External id": 226996,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115328587.428, "dur": 3.990, + "args": { + "External id": 226997,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115328690.935, "dur": 87.894, + "args": { + "External id": 226998,"Record function id": 0, "Ev Idx": 5797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115328780.816, "dur": 1083.592, + "args": { + "External id": 226999,"Record function id": 0, "Ev Idx": 5798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115328823.780, "dur": 1027.052, + "args": { + "External id": 227000,"Sequence number": 2757770, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5799 + } + }, + { + "ph": "s", "id": 186, "pid": 4183442, "tid": 4183442, "ts": 667115328823.780, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115328888.718, "dur": 43.741, + "args": { + "External id": 227001,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115328946.217, "dur": 92.608, + "args": { + "External id": 227002,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329050.285, "dur": 33.846, + "args": { + "External id": 227003,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329093.330, "dur": 29.078, + "args": { + "External id": 227004,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115329147.329, "dur": 26.936, + "args": { + "External id": 227005,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115329191.370, "dur": 14.896, + "args": { + "External id": 227006,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115329224.357, "dur": 131.256, + "args": { + "External id": 227007,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115329274.202, "dur": 11.704, + "args": { + "External id": 227008,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115329279.687, "dur": 5.427, + "args": { + "External id": 227009,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115329288.601, "dur": 5.932, + "args": { + "External id": 227010,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115329295.995, "dur": 1.359, + "args": { + "External id": 227011,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115329299.775, "dur": 3.901, + "args": { + "External id": 227012,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329365.831, "dur": 44.499, + "args": { + "External id": 227013,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115329440.201, "dur": 28.888, + "args": { + "External id": 227014,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329478.096, "dur": 58.400, + "args": { + "External id": 227015,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329548.978, "dur": 34.760, + "args": { + "External id": 227016,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115329613.279, "dur": 29.169, + "args": { + "External id": 227017,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115329650.477, "dur": 89.672, + "args": { + "External id": 227018,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115329763.870, "dur": 20.196, + "args": { + "External id": 227019,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5818 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.12)", "pid": 4183442, "tid": 4183442, + "ts": 667115329926.980, "dur": 79.298, + "args": { + "External id": 227020,"Record function id": 0, "Ev Idx": 5819 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115330080.311, "dur": 43.969, + "args": { + "External id": 227021,"Record function id": 0, "Ev Idx": 5820 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.13)", "pid": 4183442, "tid": 4183442, + "ts": 667115330134.127, "dur": 9273.181, + "args": { + "External id": 227022,"Record function id": 0, "Ev Idx": 5821 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 4183442, "tid": 4183442, + "ts": 667115330143.975, "dur": 895.610, + "args": { + "External id": 227023,"Record function id": 0, "Ev Idx": 5822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115330221.339, "dur": 7.844, + "args": { + "External id": 227024,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115330242.645, "dur": 38.897, + "args": { + "External id": 227025,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330248.210, "dur": 2.397, + "args": { + "External id": 227026,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330255.016, "dur": 0.294, + "args": { + "External id": 227027,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330257.022, "dur": 0.390, + "args": { + "External id": 227028,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330259.283, "dur": 0.738, + "args": { + "External id": 227029,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330263.451, "dur": 0.407, + "args": { + "External id": 227030,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330265.298, "dur": 0.353, + "args": { + "External id": 227031,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330267.054, "dur": 3.673, + "args": { + "External id": 227032,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330272.371, "dur": 0.498, + "args": { + "External id": 227033,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330274.735, "dur": 0.326, + "args": { + "External id": 227034,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115330292.960, "dur": 36.922, + "args": { + "External id": 227035,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115330362.158, "dur": 113.708, + "args": { + "External id": 227036,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115330372.953, "dur": 4.332, + "args": { + "External id": 227037,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115330382.578, "dur": 10.009, + "args": { + "External id": 227038,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115330386.811, "dur": 5.363, + "args": { + "External id": 227039,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330390.630, "dur": 0.409, + "args": { + "External id": 227040,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115330399.433, "dur": 32.548, + "args": { + "External id": 227041,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330401.867, "dur": 2.825, + "args": { + "External id": 227042,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330406.366, "dur": 0.420, + "args": { + "External id": 227043,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330408.129, "dur": 0.186, + "args": { + "External id": 227044,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330412.260, "dur": 1.285, + "args": { + "External id": 227045,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330414.968, "dur": 0.361, + "args": { + "External id": 227046,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330416.984, "dur": 0.411, + "args": { + "External id": 227047,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330420.699, "dur": 0.516, + "args": { + "External id": 227048,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330422.523, "dur": 0.205, + "args": { + "External id": 227049,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115330424.535, "dur": 2.518, + "args": { + "External id": 227050,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115330445.948, "dur": 22.081, + "args": { + "External id": 227051,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115330547.134, "dur": 395.172, + "args": { + "External id": 227052,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115330574.941, "dur": 361.702, + "args": { + "External id": 227053,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5852, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115330585.305, "dur": 345.174, + "args": { + "External id": 227054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115330964.557, "dur": 2.850, + "args": { + "External id": 227055,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5854, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 4183442, "tid": 4183442, + "ts": 667115331061.391, "dur": 8147.039, + "args": { + "External id": 227056,"Record function id": 0, "Ev Idx": 5855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331167.321, "dur": 6.524, + "args": { + "External id": 227057,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331177.119, "dur": 1.098, + "args": { + "External id": 227058,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331180.056, "dur": 1.392, + "args": { + "External id": 227059,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331183.147, "dur": 0.988, + "args": { + "External id": 227060,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331185.488, "dur": 1.088, + "args": { + "External id": 227061,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331188.046, "dur": 1.359, + "args": { + "External id": 227062,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331191.715, "dur": 1.081, + "args": { + "External id": 227063,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331194.625, "dur": 2.348, + "args": { + "External id": 227064,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331198.914, "dur": 1.303, + "args": { + "External id": 227065,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115331202.095, "dur": 1.118, + "args": { + "External id": 227066,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115331222.812, "dur": 7948.034, + "args": { + "External id": 227067,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115331240.489, "dur": 7923.300, + "args": { + "External id": 227068,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115331260.543, "dur": 14.307, + "args": { + "External id": 227069,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115331277.589, "dur": 7852.682, + "args": { + "External id": 227070,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115331280.285, "dur": 7849.447, + "args": { + "External id": 227071,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115331286.245, "dur": 6.918, + "args": { + "External id": 227072,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115331294.782, "dur": 7832.457, + "args": { + "External id": 227073,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115339346.496, "dur": 36.156, + "args": { + "External id": 227074,"Sequence number": 2757771, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5873 + } + }, + { + "ph": "s", "id": 185, "pid": 4183442, "tid": 4183442, "ts": 667115339346.496, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115339367.847, "dur": 9.650, + "args": { + "External id": 227075,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115339370.704, "dur": 6.517, + "args": { + "External id": 227076,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115339446.422, "dur": 101.423, + "args": { + "External id": 227077,"Record function id": 0, "Ev Idx": 5876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115339550.765, "dur": 1076.105, + "args": { + "External id": 227078,"Record function id": 0, "Ev Idx": 5877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115339594.050, "dur": 1018.754, + "args": { + "External id": 227079,"Sequence number": 2757772, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5878 + } + }, + { + "ph": "s", "id": 184, "pid": 4183442, "tid": 4183442, "ts": 667115339594.050, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115339690.376, "dur": 44.281, + "args": { + "External id": 227080,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115339751.092, "dur": 94.363, + "args": { + "External id": 227081,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115339855.345, "dur": 34.539, + "args": { + "External id": 227082,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115339899.584, "dur": 29.932, + "args": { + "External id": 227083,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115339953.934, "dur": 26.843, + "args": { + "External id": 227084,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115339998.660, "dur": 17.541, + "args": { + "External id": 227085,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115340034.028, "dur": 132.086, + "args": { + "External id": 227086,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115340084.158, "dur": 12.078, + "args": { + "External id": 227087,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115340089.422, "dur": 5.990, + "args": { + "External id": 227088,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115340099.296, "dur": 6.280, + "args": { + "External id": 227089,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115340107.108, "dur": 1.704, + "args": { + "External id": 227090,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115340111.101, "dur": 2.886, + "args": { + "External id": 227091,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115340177.888, "dur": 44.167, + "args": { + "External id": 227092,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115340252.667, "dur": 30.551, + "args": { + "External id": 227093,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115340291.609, "dur": 37.510, + "args": { + "External id": 227094,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115340338.590, "dur": 32.025, + "args": { + "External id": 227095,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115340392.108, "dur": 26.525, + "args": { + "External id": 227096,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115340424.831, "dur": 49.788, + "args": { + "External id": 227097,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115340512.379, "dur": 23.453, + "args": { + "External id": 227098,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5897 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.13)", "pid": 4183442, "tid": 4183442, + "ts": 667115340724.745, "dur": 81.507, + "args": { + "External id": 227099,"Record function id": 0, "Ev Idx": 5898 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115340881.752, "dur": 46.729, + "args": { + "External id": 227100,"Record function id": 0, "Ev Idx": 5899 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.14)", "pid": 4183442, "tid": 4183442, + "ts": 667115340938.694, "dur": 9134.689, + "args": { + "External id": 227101,"Record function id": 0, "Ev Idx": 5900 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 4183442, "tid": 4183442, + "ts": 667115340949.854, "dur": 901.551, + "args": { + "External id": 227102,"Record function id": 0, "Ev Idx": 5901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115341030.899, "dur": 9.432, + "args": { + "External id": 227103,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115341054.146, "dur": 49.309, + "args": { + "External id": 227104,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341065.398, "dur": 3.146, + "args": { + "External id": 227105,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341073.602, "dur": 0.885, + "args": { + "External id": 227106,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341076.024, "dur": 0.876, + "args": { + "External id": 227107,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341078.876, "dur": 2.508, + "args": { + "External id": 227108,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341082.597, "dur": 0.647, + "args": { + "External id": 227109,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341086.764, "dur": 0.618, + "args": { + "External id": 227110,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341090.627, "dur": 0.495, + "args": { + "External id": 227111,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341092.055, "dur": 0.652, + "args": { + "External id": 227112,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341093.612, "dur": 2.520, + "args": { + "External id": 227113,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115341115.211, "dur": 40.237, + "args": { + "External id": 227114,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115341187.056, "dur": 107.500, + "args": { + "External id": 227115,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115341197.222, "dur": 4.903, + "args": { + "External id": 227116,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115341207.199, "dur": 10.337, + "args": { + "External id": 227117,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115341211.520, "dur": 5.565, + "args": { + "External id": 227118,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341215.031, "dur": 0.849, + "args": { + "External id": 227119,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115341224.692, "dur": 28.992, + "args": { + "External id": 227120,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341226.777, "dur": 0.784, + "args": { + "External id": 227121,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341229.581, "dur": 0.746, + "args": { + "External id": 227122,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341231.474, "dur": 2.375, + "args": { + "External id": 227123,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341235.209, "dur": 0.680, + "args": { + "External id": 227124,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341237.110, "dur": 0.429, + "args": { + "External id": 227125,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341241.507, "dur": 0.412, + "args": { + "External id": 227126,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341243.237, "dur": 0.635, + "args": { + "External id": 227127,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341244.929, "dur": 0.625, + "args": { + "External id": 227128,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115341248.466, "dur": 0.413, + "args": { + "External id": 227129,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115341264.674, "dur": 22.169, + "args": { + "External id": 227130,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115341346.207, "dur": 406.404, + "args": { + "External id": 227131,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115341372.089, "dur": 374.295, + "args": { + "External id": 227132,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5931, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115341382.109, "dur": 358.034, + "args": { + "External id": 227133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115341775.644, "dur": 2.493, + "args": { + "External id": 227134,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5933, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 4183442, "tid": 4183442, + "ts": 667115341872.997, "dur": 8006.307, + "args": { + "External id": 227135,"Record function id": 0, "Ev Idx": 5934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115341978.730, "dur": 7.018, + "args": { + "External id": 227136,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115341989.147, "dur": 1.619, + "args": { + "External id": 227137,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115341992.468, "dur": 1.699, + "args": { + "External id": 227138,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115341996.096, "dur": 1.063, + "args": { + "External id": 227139,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115341998.867, "dur": 1.380, + "args": { + "External id": 227140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115342002.345, "dur": 0.955, + "args": { + "External id": 227141,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115342005.644, "dur": 1.358, + "args": { + "External id": 227142,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115342008.833, "dur": 3.022, + "args": { + "External id": 227143,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115342013.700, "dur": 1.486, + "args": { + "External id": 227144,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115342017.295, "dur": 1.092, + "args": { + "External id": 227145,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115342036.547, "dur": 7804.803, + "args": { + "External id": 227146,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115342051.142, "dur": 7784.002, + "args": { + "External id": 227147,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115342070.716, "dur": 15.001, + "args": { + "External id": 227148,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115342088.163, "dur": 7716.961, + "args": { + "External id": 227149,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115342090.791, "dur": 7713.820, + "args": { + "External id": 227150,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115342096.634, "dur": 7.159, + "args": { + "External id": 227151,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115342105.429, "dur": 7696.290, + "args": { + "External id": 227152,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115350020.334, "dur": 29.181, + "args": { + "External id": 227153,"Sequence number": 2757773, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5952 + } + }, + { + "ph": "s", "id": 183, "pid": 4183442, "tid": 4183442, "ts": 667115350020.334, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115350036.639, "dur": 7.909, + "args": { + "External id": 227154,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115350039.757, "dur": 4.533, + "args": { + "External id": 227155,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115350112.185, "dur": 84.076, + "args": { + "External id": 227156,"Record function id": 0, "Ev Idx": 5955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115350198.066, "dur": 1092.333, + "args": { + "External id": 227157,"Record function id": 0, "Ev Idx": 5956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115350237.307, "dur": 1039.676, + "args": { + "External id": 227158,"Sequence number": 2757774, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5957 + } + }, + { + "ph": "s", "id": 182, "pid": 4183442, "tid": 4183442, "ts": 667115350237.307, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115350300.460, "dur": 40.214, + "args": { + "External id": 227159,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115350354.075, "dur": 88.451, + "args": { + "External id": 227160,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115350452.098, "dur": 34.790, + "args": { + "External id": 227161,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115350515.248, "dur": 33.830, + "args": { + "External id": 227162,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115350574.183, "dur": 27.963, + "args": { + "External id": 227163,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115350620.556, "dur": 13.713, + "args": { + "External id": 227164,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115350685.721, "dur": 147.351, + "args": { + "External id": 227165,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115350748.373, "dur": 12.766, + "args": { + "External id": 227166,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115350753.052, "dur": 7.202, + "args": { + "External id": 227167,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115350763.818, "dur": 6.058, + "args": { + "External id": 227168,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115350771.226, "dur": 1.969, + "args": { + "External id": 227169,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115350776.062, "dur": 3.319, + "args": { + "External id": 227170,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115350845.258, "dur": 52.421, + "args": { + "External id": 227171,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115350930.973, "dur": 29.825, + "args": { + "External id": 227172,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115350969.234, "dur": 38.728, + "args": { + "External id": 227173,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115351017.246, "dur": 49.509, + "args": { + "External id": 227174,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115351088.860, "dur": 28.550, + "args": { + "External id": 227175,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115351123.599, "dur": 47.396, + "args": { + "External id": 227176,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115351191.338, "dur": 18.348, + "args": { + "External id": 227177,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5976 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.14)", "pid": 4183442, "tid": 4183442, + "ts": 667115351353.248, "dur": 78.034, + "args": { + "External id": 227178,"Record function id": 0, "Ev Idx": 5977 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115351524.376, "dur": 50.605, + "args": { + "External id": 227179,"Record function id": 0, "Ev Idx": 5978 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.15)", "pid": 4183442, "tid": 4183442, + "ts": 667115351584.683, "dur": 9529.613, + "args": { + "External id": 227180,"Record function id": 0, "Ev Idx": 5979 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 4183442, "tid": 4183442, + "ts": 667115351594.136, "dur": 883.384, + "args": { + "External id": 227181,"Record function id": 0, "Ev Idx": 5980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115351714.711, "dur": 10.308, + "args": { + "External id": 227182,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115351739.464, "dur": 39.057, + "args": { + "External id": 227183,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351744.810, "dur": 2.810, + "args": { + "External id": 227184,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351752.874, "dur": 0.483, + "args": { + "External id": 227185,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351754.476, "dur": 0.404, + "args": { + "External id": 227186,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351756.229, "dur": 0.987, + "args": { + "External id": 227187,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351760.353, "dur": 0.583, + "args": { + "External id": 227188,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351762.589, "dur": 0.653, + "args": { + "External id": 227189,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351764.440, "dur": 2.825, + "args": { + "External id": 227190,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351768.751, "dur": 0.569, + "args": { + "External id": 227191,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351770.732, "dur": 0.545, + "args": { + "External id": 227192,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115351790.858, "dur": 41.638, + "args": { + "External id": 227193,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115351866.992, "dur": 119.035, + "args": { + "External id": 227194,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115351877.915, "dur": 4.490, + "args": { + "External id": 227195,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115351887.432, "dur": 10.234, + "args": { + "External id": 227196,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115351891.823, "dur": 5.410, + "args": { + "External id": 227197,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351895.310, "dur": 0.675, + "args": { + "External id": 227198,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115351904.123, "dur": 30.580, + "args": { + "External id": 227199,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351905.790, "dur": 3.587, + "args": { + "External id": 227200,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351910.629, "dur": 0.907, + "args": { + "External id": 227201,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351912.699, "dur": 0.601, + "args": { + "External id": 227202,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351916.888, "dur": 0.517, + "args": { + "External id": 227203,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351918.497, "dur": 0.701, + "args": { + "External id": 227204,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351920.841, "dur": 0.344, + "args": { + "External id": 227205,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351923.989, "dur": 0.341, + "args": { + "External id": 227206,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351925.620, "dur": 0.428, + "args": { + "External id": 227207,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115351927.067, "dur": 2.133, + "args": { + "External id": 227208,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115351955.321, "dur": 21.418, + "args": { + "External id": 227209,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115352040.770, "dur": 350.288, + "args": { + "External id": 227210,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115352065.901, "dur": 321.012, + "args": { + "External id": 227211,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6010, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115352077.694, "dur": 303.796, + "args": { + "External id": 227212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115352410.402, "dur": 2.340, + "args": { + "External id": 227213,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6012, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 4183442, "tid": 4183442, + "ts": 667115352518.658, "dur": 8395.300, + "args": { + "External id": 227214,"Record function id": 0, "Ev Idx": 6013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352619.395, "dur": 6.859, + "args": { + "External id": 227215,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352629.519, "dur": 1.642, + "args": { + "External id": 227216,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352632.680, "dur": 1.401, + "args": { + "External id": 227217,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352635.866, "dur": 1.320, + "args": { + "External id": 227218,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352638.672, "dur": 1.519, + "args": { + "External id": 227219,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352641.763, "dur": 1.298, + "args": { + "External id": 227220,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352645.082, "dur": 1.294, + "args": { + "External id": 227221,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352648.127, "dur": 2.306, + "args": { + "External id": 227222,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352687.211, "dur": 2.137, + "args": { + "External id": 227223,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115352691.776, "dur": 1.151, + "args": { + "External id": 227224,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115352712.338, "dur": 8161.227, + "args": { + "External id": 227225,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115352727.767, "dur": 8139.274, + "args": { + "External id": 227226,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115352743.583, "dur": 14.837, + "args": { + "External id": 227227,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115352761.338, "dur": 8075.903, + "args": { + "External id": 227228,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115352763.730, "dur": 8072.993, + "args": { + "External id": 227229,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115352770.391, "dur": 7.891, + "args": { + "External id": 227230,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115352780.209, "dur": 8053.589, + "args": { + "External id": 227231,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115361057.806, "dur": 30.962, + "args": { + "External id": 227232,"Sequence number": 2757775, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6031 + } + }, + { + "ph": "s", "id": 181, "pid": 4183442, "tid": 4183442, "ts": 667115361057.806, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115361076.246, "dur": 7.738, + "args": { + "External id": 227233,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115361079.348, "dur": 4.405, + "args": { + "External id": 227234,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115361153.691, "dur": 84.826, + "args": { + "External id": 227235,"Record function id": 0, "Ev Idx": 6034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115361240.173, "dur": 1106.613, + "args": { + "External id": 227236,"Record function id": 0, "Ev Idx": 6035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115361282.186, "dur": 1051.273, + "args": { + "External id": 227237,"Sequence number": 2757776, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6036 + } + }, + { + "ph": "s", "id": 180, "pid": 4183442, "tid": 4183442, "ts": 667115361282.186, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115361346.158, "dur": 39.552, + "args": { + "External id": 227238,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115361399.470, "dur": 88.656, + "args": { + "External id": 227239,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115361516.403, "dur": 40.617, + "args": { + "External id": 227240,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115361567.047, "dur": 28.967, + "args": { + "External id": 227241,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115361622.928, "dur": 60.444, + "args": { + "External id": 227242,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115361705.303, "dur": 20.234, + "args": { + "External id": 227243,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115361743.792, "dur": 133.145, + "args": { + "External id": 227244,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115361796.548, "dur": 12.966, + "args": { + "External id": 227245,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115361801.461, "dur": 7.241, + "args": { + "External id": 227246,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115361812.005, "dur": 6.260, + "args": { + "External id": 227247,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115361819.548, "dur": 1.875, + "args": { + "External id": 227248,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115361823.574, "dur": 3.508, + "args": { + "External id": 227249,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115361888.242, "dur": 51.901, + "args": { + "External id": 227250,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115361971.196, "dur": 33.031, + "args": { + "External id": 227251,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115362012.555, "dur": 38.323, + "args": { + "External id": 227252,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115362059.611, "dur": 49.712, + "args": { + "External id": 227253,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115362130.740, "dur": 32.365, + "args": { + "External id": 227254,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115362169.709, "dur": 47.866, + "args": { + "External id": 227255,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115362239.356, "dur": 20.121, + "args": { + "External id": 227256,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6055 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.15)", "pid": 4183442, "tid": 4183442, + "ts": 667115362410.463, "dur": 77.056, + "args": { + "External id": 227257,"Record function id": 0, "Ev Idx": 6056 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115362581.175, "dur": 49.105, + "args": { + "External id": 227258,"Record function id": 0, "Ev Idx": 6057 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.16)", "pid": 4183442, "tid": 4183442, + "ts": 667115362639.942, "dur": 9527.583, + "args": { + "External id": 227259,"Record function id": 0, "Ev Idx": 6058 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 4183442, "tid": 4183442, + "ts": 667115362649.598, "dur": 970.309, + "args": { + "External id": 227260,"Record function id": 0, "Ev Idx": 6059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115362775.633, "dur": 9.857, + "args": { + "External id": 227261,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115362799.130, "dur": 39.060, + "args": { + "External id": 227262,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362804.770, "dur": 2.228, + "args": { + "External id": 227263,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362811.601, "dur": 0.771, + "args": { + "External id": 227264,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362813.698, "dur": 0.915, + "args": { + "External id": 227265,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362816.071, "dur": 0.895, + "args": { + "External id": 227266,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362820.171, "dur": 0.674, + "args": { + "External id": 227267,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362822.282, "dur": 0.712, + "args": { + "External id": 227268,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362824.558, "dur": 2.408, + "args": { + "External id": 227269,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362828.375, "dur": 0.564, + "args": { + "External id": 227270,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362830.155, "dur": 0.558, + "args": { + "External id": 227271,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115362851.957, "dur": 40.507, + "args": { + "External id": 227272,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115362925.616, "dur": 109.767, + "args": { + "External id": 227273,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115362936.874, "dur": 6.984, + "args": { + "External id": 227274,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115362949.074, "dur": 10.424, + "args": { + "External id": 227275,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115362953.377, "dur": 5.533, + "args": { + "External id": 227276,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362956.702, "dur": 0.873, + "args": { + "External id": 227277,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115362966.149, "dur": 29.113, + "args": { + "External id": 227278,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362968.257, "dur": 0.706, + "args": { + "External id": 227279,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362970.627, "dur": 2.936, + "args": { + "External id": 227280,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362974.832, "dur": 0.765, + "args": { + "External id": 227281,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362976.846, "dur": 0.641, + "args": { + "External id": 227282,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362980.578, "dur": 0.456, + "args": { + "External id": 227283,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362982.424, "dur": 0.612, + "args": { + "External id": 227284,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362984.328, "dur": 0.589, + "args": { + "External id": 227285,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362988.066, "dur": 0.700, + "args": { + "External id": 227286,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115362989.742, "dur": 0.692, + "args": { + "External id": 227287,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115363005.911, "dur": 21.332, + "args": { + "External id": 227288,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115363087.815, "dur": 428.771, + "args": { + "External id": 227289,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115363114.516, "dur": 395.396, + "args": { + "External id": 227290,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6089, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115363124.413, "dur": 357.469, + "args": { + "External id": 227291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115363539.517, "dur": 3.679, + "args": { + "External id": 227292,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6091, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 4183442, "tid": 4183442, + "ts": 667115363643.328, "dur": 8326.549, + "args": { + "External id": 227293,"Record function id": 0, "Ev Idx": 6092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363802.285, "dur": 7.627, + "args": { + "External id": 227294,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363813.498, "dur": 1.426, + "args": { + "External id": 227295,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363816.687, "dur": 1.353, + "args": { + "External id": 227296,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363819.918, "dur": 1.193, + "args": { + "External id": 227297,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363822.947, "dur": 1.950, + "args": { + "External id": 227298,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363826.671, "dur": 1.273, + "args": { + "External id": 227299,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363829.837, "dur": 1.329, + "args": { + "External id": 227300,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363832.964, "dur": 2.494, + "args": { + "External id": 227301,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363837.216, "dur": 1.149, + "args": { + "External id": 227302,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115363840.091, "dur": 0.949, + "args": { + "External id": 227303,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115363860.724, "dur": 8070.910, + "args": { + "External id": 227304,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115363877.580, "dur": 8047.550, + "args": { + "External id": 227305,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115363892.675, "dur": 15.414, + "args": { + "External id": 227306,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115363910.793, "dur": 7982.374, + "args": { + "External id": 227307,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115363913.256, "dur": 7979.486, + "args": { + "External id": 227308,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115363920.038, "dur": 7.518, + "args": { + "External id": 227309,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115363929.240, "dur": 7960.791, + "args": { + "External id": 227310,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115372113.552, "dur": 29.345, + "args": { + "External id": 227311,"Sequence number": 2757777, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6110 + } + }, + { + "ph": "s", "id": 179, "pid": 4183442, "tid": 4183442, "ts": 667115372113.552, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115372129.810, "dur": 7.984, + "args": { + "External id": 227312,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115372132.994, "dur": 4.595, + "args": { + "External id": 227313,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115372208.978, "dur": 85.260, + "args": { + "External id": 227314,"Record function id": 0, "Ev Idx": 6113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115372296.000, "dur": 1124.341, + "args": { + "External id": 227315,"Record function id": 0, "Ev Idx": 6114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115372335.500, "dur": 1071.311, + "args": { + "External id": 227316,"Sequence number": 2757778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6115 + } + }, + { + "ph": "s", "id": 178, "pid": 4183442, "tid": 4183442, "ts": 667115372335.500, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115372399.618, "dur": 41.499, + "args": { + "External id": 227317,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115372455.499, "dur": 109.214, + "args": { + "External id": 227318,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115372576.986, "dur": 37.064, + "args": { + "External id": 227319,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115372623.150, "dur": 63.541, + "args": { + "External id": 227320,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115372721.341, "dur": 33.374, + "args": { + "External id": 227321,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115372771.593, "dur": 17.296, + "args": { + "External id": 227322,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115372806.777, "dur": 136.899, + "args": { + "External id": 227323,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115372860.293, "dur": 11.793, + "args": { + "External id": 227324,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115372865.482, "dur": 5.857, + "args": { + "External id": 227325,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115372874.779, "dur": 6.510, + "args": { + "External id": 227326,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115372882.886, "dur": 1.746, + "args": { + "External id": 227327,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115372886.808, "dur": 5.545, + "args": { + "External id": 227328,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115372981.752, "dur": 54.953, + "args": { + "External id": 227329,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115373070.482, "dur": 29.128, + "args": { + "External id": 227330,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115373108.210, "dur": 42.208, + "args": { + "External id": 227331,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115373159.608, "dur": 45.620, + "args": { + "External id": 227332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115373226.668, "dur": 26.622, + "args": { + "External id": 227333,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115373259.342, "dur": 40.930, + "args": { + "External id": 227334,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115373320.323, "dur": 18.559, + "args": { + "External id": 227335,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6134 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.16)", "pid": 4183442, "tid": 4183442, + "ts": 667115373483.866, "dur": 99.015, + "args": { + "External id": 227336,"Record function id": 0, "Ev Idx": 6135 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115373696.987, "dur": 52.427, + "args": { + "External id": 227337,"Record function id": 0, "Ev Idx": 6136 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.17)", "pid": 4183442, "tid": 4183442, + "ts": 667115373760.316, "dur": 9214.903, + "args": { + "External id": 227338,"Record function id": 0, "Ev Idx": 6137 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 4183442, "tid": 4183442, + "ts": 667115373768.493, "dur": 869.807, + "args": { + "External id": 227339,"Record function id": 0, "Ev Idx": 6138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115373850.838, "dur": 9.962, + "args": { + "External id": 227340,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115373875.004, "dur": 37.158, + "args": { + "External id": 227341,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373880.088, "dur": 2.218, + "args": { + "External id": 227342,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373886.833, "dur": 0.840, + "args": { + "External id": 227343,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373888.975, "dur": 0.614, + "args": { + "External id": 227344,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373891.242, "dur": 0.585, + "args": { + "External id": 227345,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373894.911, "dur": 0.652, + "args": { + "External id": 227346,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373896.956, "dur": 0.763, + "args": { + "External id": 227347,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373898.748, "dur": 2.651, + "args": { + "External id": 227348,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373903.063, "dur": 0.749, + "args": { + "External id": 227349,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115373904.781, "dur": 0.606, + "args": { + "External id": 227350,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115373924.746, "dur": 41.706, + "args": { + "External id": 227351,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115373998.152, "dur": 109.223, + "args": { + "External id": 227352,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115374008.490, "dur": 4.604, + "args": { + "External id": 227353,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115374017.834, "dur": 9.909, + "args": { + "External id": 227354,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115374022.126, "dur": 5.216, + "args": { + "External id": 227355,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374025.401, "dur": 0.720, + "args": { + "External id": 227356,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115374034.547, "dur": 30.436, + "args": { + "External id": 227357,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374036.644, "dur": 2.758, + "args": { + "External id": 227358,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374041.304, "dur": 0.604, + "args": { + "External id": 227359,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374042.925, "dur": 0.894, + "args": { + "External id": 227360,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374047.478, "dur": 0.550, + "args": { + "External id": 227361,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374049.124, "dur": 0.388, + "args": { + "External id": 227362,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374051.059, "dur": 0.648, + "args": { + "External id": 227363,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374054.472, "dur": 0.839, + "args": { + "External id": 227364,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374056.371, "dur": 0.449, + "args": { + "External id": 227365,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374057.818, "dur": 2.049, + "args": { + "External id": 227366,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115374077.751, "dur": 21.588, + "args": { + "External id": 227367,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115374158.597, "dur": 383.097, + "args": { + "External id": 227368,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115374182.987, "dur": 353.056, + "args": { + "External id": 227369,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6168, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115374192.796, "dur": 337.404, + "args": { + "External id": 227370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115374563.508, "dur": 2.386, + "args": { + "External id": 227371,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6170, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 4183442, "tid": 4183442, + "ts": 667115374696.330, "dur": 8088.831, + "args": { + "External id": 227372,"Record function id": 0, "Ev Idx": 6171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374801.750, "dur": 7.147, + "args": { + "External id": 227373,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374812.265, "dur": 1.576, + "args": { + "External id": 227374,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374815.357, "dur": 1.213, + "args": { + "External id": 227375,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374818.025, "dur": 1.349, + "args": { + "External id": 227376,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374820.925, "dur": 1.348, + "args": { + "External id": 227377,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374824.096, "dur": 1.520, + "args": { + "External id": 227378,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374827.492, "dur": 1.249, + "args": { + "External id": 227379,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374830.329, "dur": 2.807, + "args": { + "External id": 227380,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374834.682, "dur": 1.200, + "args": { + "External id": 227381,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115374837.498, "dur": 1.231, + "args": { + "External id": 227382,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115374856.585, "dur": 7892.337, + "args": { + "External id": 227383,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115374871.327, "dur": 7871.132, + "args": { + "External id": 227384,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115374887.880, "dur": 14.796, + "args": { + "External id": 227385,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115374905.300, "dur": 7807.937, + "args": { + "External id": 227386,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115374907.867, "dur": 7804.904, + "args": { + "External id": 227387,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115374914.323, "dur": 7.280, + "args": { + "External id": 227388,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115374923.407, "dur": 7786.521, + "args": { + "External id": 227389,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115382922.648, "dur": 28.914, + "args": { + "External id": 227390,"Sequence number": 2757779, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6189 + } + }, + { + "ph": "s", "id": 177, "pid": 4183442, "tid": 4183442, "ts": 667115382922.648, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115382939.188, "dur": 7.420, + "args": { + "External id": 227391,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115382942.078, "dur": 4.290, + "args": { + "External id": 227392,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115383013.541, "dur": 84.557, + "args": { + "External id": 227393,"Record function id": 0, "Ev Idx": 6192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115383099.693, "dur": 1094.957, + "args": { + "External id": 227394,"Record function id": 0, "Ev Idx": 6193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115383139.111, "dur": 1041.212, + "args": { + "External id": 227395,"Sequence number": 2757780, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6194 + } + }, + { + "ph": "s", "id": 176, "pid": 4183442, "tid": 4183442, "ts": 667115383139.111, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115383202.570, "dur": 38.172, + "args": { + "External id": 227396,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383254.415, "dur": 87.587, + "args": { + "External id": 227397,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383351.491, "dur": 34.129, + "args": { + "External id": 227398,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383394.626, "dur": 29.366, + "args": { + "External id": 227399,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115383449.046, "dur": 26.567, + "args": { + "External id": 227400,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115383512.533, "dur": 18.620, + "args": { + "External id": 227401,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115383550.309, "dur": 166.599, + "args": { + "External id": 227402,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115383601.149, "dur": 11.712, + "args": { + "External id": 227403,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115383605.597, "dur": 6.490, + "args": { + "External id": 227404,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115383615.630, "dur": 6.184, + "args": { + "External id": 227405,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115383623.159, "dur": 1.820, + "args": { + "External id": 227406,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115383627.040, "dur": 2.726, + "args": { + "External id": 227407,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383730.683, "dur": 55.159, + "args": { + "External id": 227408,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115383819.913, "dur": 28.776, + "args": { + "External id": 227409,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383857.729, "dur": 39.179, + "args": { + "External id": 227410,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115383906.527, "dur": 50.665, + "args": { + "External id": 227411,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115383979.026, "dur": 29.397, + "args": { + "External id": 227412,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115384014.936, "dur": 49.166, + "args": { + "External id": 227413,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115384086.024, "dur": 19.747, + "args": { + "External id": 227414,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6213 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.17)", "pid": 4183442, "tid": 4183442, + "ts": 667115384259.018, "dur": 80.345, + "args": { + "External id": 227415,"Record function id": 0, "Ev Idx": 6214 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115384412.658, "dur": 47.567, + "args": { + "External id": 227416,"Record function id": 0, "Ev Idx": 6215 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.18)", "pid": 4183442, "tid": 4183442, + "ts": 667115384468.872, "dur": 9346.854, + "args": { + "External id": 227417,"Record function id": 0, "Ev Idx": 6216 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 4183442, "tid": 4183442, + "ts": 667115384476.962, "dur": 896.879, + "args": { + "External id": 227418,"Record function id": 0, "Ev Idx": 6217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115384581.798, "dur": 10.321, + "args": { + "External id": 227419,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115384605.440, "dur": 37.848, + "args": { + "External id": 227420,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384611.368, "dur": 2.447, + "args": { + "External id": 227421,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384618.704, "dur": 0.466, + "args": { + "External id": 227422,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384620.679, "dur": 0.560, + "args": { + "External id": 227423,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384622.646, "dur": 0.453, + "args": { + "External id": 227424,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384626.322, "dur": 0.534, + "args": { + "External id": 227425,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384628.107, "dur": 0.682, + "args": { + "External id": 227426,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384629.891, "dur": 2.133, + "args": { + "External id": 227427,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384633.424, "dur": 0.690, + "args": { + "External id": 227428,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384635.519, "dur": 0.804, + "args": { + "External id": 227429,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115384689.833, "dur": 41.641, + "args": { + "External id": 227430,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115384766.916, "dur": 116.238, + "args": { + "External id": 227431,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115384781.976, "dur": 7.734, + "args": { + "External id": 227432,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115384794.953, "dur": 11.455, + "args": { + "External id": 227433,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115384799.380, "dur": 6.645, + "args": { + "External id": 227434,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384803.246, "dur": 1.063, + "args": { + "External id": 227435,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115384813.601, "dur": 29.172, + "args": { + "External id": 227436,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384815.523, "dur": 0.613, + "args": { + "External id": 227437,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384817.732, "dur": 2.996, + "args": { + "External id": 227438,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384822.129, "dur": 0.450, + "args": { + "External id": 227439,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384823.649, "dur": 0.785, + "args": { + "External id": 227440,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384828.784, "dur": 0.428, + "args": { + "External id": 227441,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384830.594, "dur": 0.461, + "args": { + "External id": 227442,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384832.537, "dur": 0.636, + "args": { + "External id": 227443,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384836.411, "dur": 0.362, + "args": { + "External id": 227444,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115384838.027, "dur": 0.629, + "args": { + "External id": 227445,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115384853.461, "dur": 21.945, + "args": { + "External id": 227446,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115384936.275, "dur": 351.984, + "args": { + "External id": 227447,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115384962.331, "dur": 321.422, + "args": { + "External id": 227448,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6247, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115384972.531, "dur": 305.685, + "args": { + "External id": 227449,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115385307.121, "dur": 2.098, + "args": { + "External id": 227450,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6249, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 4183442, "tid": 4183442, + "ts": 667115385394.338, "dur": 8195.284, + "args": { + "External id": 227451,"Record function id": 0, "Ev Idx": 6250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385489.924, "dur": 24.854, + "args": { + "External id": 227452,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385520.345, "dur": 1.823, + "args": { + "External id": 227453,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385524.112, "dur": 1.590, + "args": { + "External id": 227454,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385527.612, "dur": 1.200, + "args": { + "External id": 227455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385530.514, "dur": 1.261, + "args": { + "External id": 227456,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385533.508, "dur": 1.106, + "args": { + "External id": 227457,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385536.726, "dur": 1.148, + "args": { + "External id": 227458,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385540.078, "dur": 2.388, + "args": { + "External id": 227459,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385544.480, "dur": 1.347, + "args": { + "External id": 227460,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115385547.920, "dur": 0.785, + "args": { + "External id": 227461,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115385567.640, "dur": 7983.350, + "args": { + "External id": 227462,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115385582.666, "dur": 7962.093, + "args": { + "External id": 227463,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115385597.393, "dur": 15.864, + "args": { + "External id": 227464,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115385616.288, "dur": 7891.990, + "args": { + "External id": 227465,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115385618.478, "dur": 7889.224, + "args": { + "External id": 227466,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115385625.134, "dur": 5.559, + "args": { + "External id": 227467,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115385632.453, "dur": 7872.368, + "args": { + "External id": 227468,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115393761.536, "dur": 29.437, + "args": { + "External id": 227469,"Sequence number": 2757781, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6268 + } + }, + { + "ph": "s", "id": 175, "pid": 4183442, "tid": 4183442, "ts": 667115393761.536, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115393778.403, "dur": 7.323, + "args": { + "External id": 227470,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115393781.217, "dur": 4.156, + "args": { + "External id": 227471,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115393853.536, "dur": 84.598, + "args": { + "External id": 227472,"Record function id": 0, "Ev Idx": 6271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115393939.997, "dur": 1080.532, + "args": { + "External id": 227473,"Record function id": 0, "Ev Idx": 6272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115393980.072, "dur": 1026.798, + "args": { + "External id": 227474,"Sequence number": 2757782, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6273 + } + }, + { + "ph": "s", "id": 174, "pid": 4183442, "tid": 4183442, "ts": 667115393980.072, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115394047.701, "dur": 44.171, + "args": { + "External id": 227475,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394108.804, "dur": 90.050, + "args": { + "External id": 227476,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394207.850, "dur": 33.982, + "args": { + "External id": 227477,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394248.555, "dur": 29.148, + "args": { + "External id": 227478,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115394303.971, "dur": 23.021, + "args": { + "External id": 227479,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115394342.196, "dur": 16.393, + "args": { + "External id": 227480,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115394373.184, "dur": 148.896, + "args": { + "External id": 227481,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115394421.729, "dur": 12.257, + "args": { + "External id": 227482,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115394426.420, "dur": 6.585, + "args": { + "External id": 227483,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115394437.081, "dur": 4.345, + "args": { + "External id": 227484,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115394442.820, "dur": 3.433, + "args": { + "External id": 227485,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115394448.734, "dur": 3.151, + "args": { + "External id": 227486,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394535.163, "dur": 48.639, + "args": { + "External id": 227487,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115394618.493, "dur": 28.966, + "args": { + "External id": 227488,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394694.258, "dur": 43.777, + "args": { + "External id": 227489,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394746.556, "dur": 37.080, + "args": { + "External id": 227490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115394808.686, "dur": 28.531, + "args": { + "External id": 227491,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115394843.123, "dur": 54.701, + "args": { + "External id": 227492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115394916.836, "dur": 20.935, + "args": { + "External id": 227493,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6292 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.18)", "pid": 4183442, "tid": 4183442, + "ts": 667115395083.903, "dur": 80.433, + "args": { + "External id": 227494,"Record function id": 0, "Ev Idx": 6293 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183442, "tid": 4183442, + "ts": 667115395236.866, "dur": 48.223, + "args": { + "External id": 227495,"Record function id": 0, "Ev Idx": 6294 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.19)", "pid": 4183442, "tid": 4183442, + "ts": 667115395294.902, "dur": 9269.512, + "args": { + "External id": 227496,"Record function id": 0, "Ev Idx": 6295 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 4183442, "tid": 4183442, + "ts": 667115395303.995, "dur": 907.633, + "args": { + "External id": 227497,"Record function id": 0, "Ev Idx": 6296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115395386.343, "dur": 8.409, + "args": { + "External id": 227498,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115395408.444, "dur": 35.270, + "args": { + "External id": 227499,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395413.717, "dur": 2.316, + "args": { + "External id": 227500,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395420.510, "dur": 0.360, + "args": { + "External id": 227501,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395421.917, "dur": 0.620, + "args": { + "External id": 227502,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395424.005, "dur": 0.384, + "args": { + "External id": 227503,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395427.861, "dur": 0.318, + "args": { + "External id": 227504,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395429.563, "dur": 0.422, + "args": { + "External id": 227505,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395431.243, "dur": 2.540, + "args": { + "External id": 227506,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395435.176, "dur": 0.606, + "args": { + "External id": 227507,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395436.887, "dur": 0.301, + "args": { + "External id": 227508,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115395455.809, "dur": 59.157, + "args": { + "External id": 227509,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183442, "tid": 4183442, + "ts": 667115395550.558, "dur": 157.330, + "args": { + "External id": 227510,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115395561.167, "dur": 5.450, + "args": { + "External id": 227511,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183442, "tid": 4183442, + "ts": 667115395571.763, "dur": 11.650, + "args": { + "External id": 227512,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115395576.619, "dur": 6.384, + "args": { + "External id": 227513,"Record function id": 0, "Concrete Inputs": ["", "0", "9635328", "11241216", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395580.661, "dur": 0.807, + "args": { + "External id": 227514,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183442, "tid": 4183442, + "ts": 667115395590.769, "dur": 31.044, + "args": { + "External id": 227515,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395592.991, "dur": 2.731, + "args": { + "External id": 227516,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9635328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395597.136, "dur": 0.602, + "args": { + "External id": 227517,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9635456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395598.867, "dur": 0.716, + "args": { + "External id": 227518,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9766528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395603.684, "dur": 0.653, + "args": { + "External id": 227519,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9897600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395605.635, "dur": 0.519, + "args": { + "External id": 227520,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "10028672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395607.814, "dur": 0.400, + "args": { + "External id": 227521,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10159744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395610.597, "dur": 0.756, + "args": { + "External id": 227522,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395612.811, "dur": 0.591, + "args": { + "External id": 227523,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10520320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115395614.740, "dur": 2.633, + "args": { + "External id": 227524,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10880768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115395636.596, "dur": 60.755, + "args": { + "External id": 227525,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183442, "tid": 4183442, + "ts": 667115395765.753, "dur": 356.752, + "args": { + "External id": 227526,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115395792.960, "dur": 324.998, + "args": { + "External id": 227527,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6326, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183442, "tid": 4183442, + "ts": 667115395803.275, "dur": 309.685, + "args": { + "External id": 227528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115396141.725, "dur": 2.331, + "args": { + "External id": 227529,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6328, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 4183442, "tid": 4183442, + "ts": 667115396232.546, "dur": 8118.728, + "args": { + "External id": 227530,"Record function id": 0, "Ev Idx": 6329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396334.269, "dur": 5.955, + "args": { + "External id": 227531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396353.043, "dur": 2.213, + "args": { + "External id": 227532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396356.928, "dur": 0.782, + "args": { + "External id": 227533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396359.458, "dur": 1.175, + "args": { + "External id": 227534,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396362.255, "dur": 0.882, + "args": { + "External id": 227535,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396364.255, "dur": 1.008, + "args": { + "External id": 227536,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396366.852, "dur": 0.997, + "args": { + "External id": 227537,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396369.928, "dur": 2.240, + "args": { + "External id": 227538,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396373.980, "dur": 1.691, + "args": { + "External id": 227539,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115396377.374, "dur": 1.241, + "args": { + "External id": 227540,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115396398.213, "dur": 7914.063, + "args": { + "External id": 227541,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115396412.731, "dur": 7893.078, + "args": { + "External id": 227542,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115396426.138, "dur": 14.963, + "args": { + "External id": 227543,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115396443.734, "dur": 7830.489, + "args": { + "External id": 227544,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115396446.030, "dur": 7827.666, + "args": { + "External id": 227545,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115396452.216, "dur": 5.660, + "args": { + "External id": 227546,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115396459.535, "dur": 7811.201, + "args": { + "External id": 227547,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115404488.251, "dur": 48.801, + "args": { + "External id": 227548,"Sequence number": 2757783, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6347 + } + }, + { + "ph": "s", "id": 173, "pid": 4183442, "tid": 4183442, "ts": 667115404488.251, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115404523.471, "dur": 8.264, + "args": { + "External id": 227549,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115404526.802, "dur": 4.594, + "args": { + "External id": 227550,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115404603.222, "dur": 112.619, + "args": { + "External id": 227551,"Record function id": 0, "Ev Idx": 6350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183442, "tid": 4183442, + "ts": 667115404718.941, "dur": 1064.287, + "args": { + "External id": 227552,"Record function id": 0, "Ev Idx": 6351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115404761.211, "dur": 1008.412, + "args": { + "External id": 227553,"Sequence number": 2757784, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6352 + } + }, + { + "ph": "s", "id": 172, "pid": 4183442, "tid": 4183442, "ts": 667115404761.211, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115404832.031, "dur": 43.969, + "args": { + "External id": 227554,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115404891.439, "dur": 93.335, + "args": { + "External id": 227555,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115404993.662, "dur": 33.783, + "args": { + "External id": 227556,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115405037.247, "dur": 29.403, + "args": { + "External id": 227557,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115405091.122, "dur": 26.198, + "args": { + "External id": 227558,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183442, "tid": 4183442, + "ts": 667115405135.162, "dur": 17.176, + "args": { + "External id": 227559,"kernel_hash": "czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/zh/czhnxgjeuzovurdv6xjgegtqa3tjtpwahtepnrfadzfmtmjtx5ag.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115405169.152, "dur": 125.287, + "args": { + "External id": 227560,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115405217.478, "dur": 10.641, + "args": { + "External id": 227561,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115405222.154, "dur": 5.276, + "args": { + "External id": 227562,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115405230.653, "dur": 4.988, + "args": { + "External id": 227563,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115405237.386, "dur": 1.505, + "args": { + "External id": 227564,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115405241.186, "dur": 3.148, + "args": { + "External id": 227565,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115405304.484, "dur": 41.916, + "args": { + "External id": 227566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183442, "tid": 4183442, + "ts": 667115405377.514, "dur": 29.467, + "args": { + "External id": 227567,"kernel_hash": "cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/op/cop57stup5gnbnrsecowsi4uil2l2kmuphbrgn2q3tgc6eiu4qc5.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115405415.819, "dur": 38.166, + "args": { + "External id": 227568,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115405462.634, "dur": 47.891, + "args": { + "External id": 227569,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183442, "tid": 4183442, + "ts": 667115405536.184, "dur": 27.546, + "args": { + "External id": 227570,"kernel_hash": "cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/r2/cr2bzqlvlabc4i743m6mbivqrhokpbtpv7itjeabxka7r6aei45y.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115405570.869, "dur": 49.963, + "args": { + "External id": 227571,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183442, "tid": 4183442, + "ts": 667115405640.924, "dur": 54.539, + "args": { + "External id": 227572,"kernel_hash": "ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/co/ccow4uofbk47allirjstpav26a22yvntuhmv5eu6472wlpm4kijh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6371 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.19)", "pid": 4183442, "tid": 4183442, + "ts": 667115405849.283, "dur": 32.798, + "args": { + "External id": 227573,"Record function id": 0, "Ev Idx": 6372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115405964.716, "dur": 270.557, + "args": { + "External id": 227574,"Sequence number": 2757785, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6373 + } + }, + { + "ph": "s", "id": 171, "pid": 4183442, "tid": 4183442, "ts": 667115405964.716, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115405994.616, "dur": 8.284, + "args": { + "External id": 227575,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115405996.835, "dur": 5.803, + "args": { + "External id": 227576,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115406012.027, "dur": 11.634, + "args": { + "External id": 227577,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406014.852, "dur": 8.212, + "args": { + "External id": 227578,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115406031.586, "dur": 5.145, + "args": { + "External id": 227579,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406217.764, "dur": 6.144, + "args": { + "External id": 227580,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406221.347, "dur": 2.355, + "args": { + "External id": 227581,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115406264.641, "dur": 129.080, + "args": { + "External id": 227582,"Sequence number": 2757786, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115406267.442, "dur": 13.552, + "args": { + "External id": 227583,"Sequence number": 2757786, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6382 + } + }, + { + "ph": "s", "id": 170, "pid": 4183442, "tid": 4183442, "ts": 667115406267.442, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115406273.185, "dur": 6.110, + "args": { + "External id": 227584,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406276.928, "dur": 2.042, + "args": { + "External id": 227585,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115406283.914, "dur": 109.454, + "args": { + "External id": 227586,"Sequence number": 2757787, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406286.888, "dur": 5.622, + "args": { + "External id": 227587,"Sequence number": 2757787, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406288.439, "dur": 3.922, + "args": { + "External id": 227588,"Sequence number": 2757787, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6387 + } + }, + { + "ph": "s", "id": 169, "pid": 4183442, "tid": 4183442, "ts": 667115406288.439, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115406294.769, "dur": 88.338, + "args": { + "External id": 227589,"Sequence number": 2757788, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6388 + } + }, + { + "ph": "s", "id": 168, "pid": 4183442, "tid": 4183442, "ts": 667115406294.769, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115406386.436, "dur": 5.596, + "args": { + "External id": 227590,"Sequence number": 2757789, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6389 + } + }, + { + "ph": "s", "id": 167, "pid": 4183442, "tid": 4183442, "ts": 667115406386.436, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115406404.386, "dur": 67.720, + "args": { + "External id": 227591,"Sequence number": 2757790, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115406405.925, "dur": 7.003, + "args": { + "External id": 227592,"Sequence number": 2757790, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6391 + } + }, + { + "ph": "s", "id": 166, "pid": 4183442, "tid": 4183442, "ts": 667115406405.925, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115406408.829, "dur": 3.127, + "args": { + "External id": 227593,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406410.795, "dur": 0.897, + "args": { + "External id": 227594,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115406414.102, "dur": 57.794, + "args": { + "External id": 227595,"Sequence number": 2757791, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406415.552, "dur": 6.509, + "args": { + "External id": 227596,"Sequence number": 2757791, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406416.642, "dur": 5.239, + "args": { + "External id": 227597,"Sequence number": 2757791, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6396 + } + }, + { + "ph": "s", "id": 165, "pid": 4183442, "tid": 4183442, "ts": 667115406416.642, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115406423.003, "dur": 42.055, + "args": { + "External id": 227598,"Sequence number": 2757792, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6397 + } + }, + { + "ph": "s", "id": 164, "pid": 4183442, "tid": 4183442, "ts": 667115406423.003, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115406466.663, "dur": 4.670, + "args": { + "External id": 227599,"Sequence number": 2757793, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6398 + } + }, + { + "ph": "s", "id": 163, "pid": 4183442, "tid": 4183442, "ts": 667115406466.663, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115406479.710, "dur": 91.005, + "args": { + "External id": 227600,"Sequence number": 2757794, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115406480.743, "dur": 6.739, + "args": { + "External id": 227601,"Sequence number": 2757794, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6400 + } + }, + { + "ph": "s", "id": 162, "pid": 4183442, "tid": 4183442, "ts": 667115406480.743, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115406482.994, "dur": 3.273, + "args": { + "External id": 227602,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406484.810, "dur": 1.124, + "args": { + "External id": 227603,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115406488.476, "dur": 82.040, + "args": { + "External id": 227604,"Sequence number": 2757795, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406489.961, "dur": 27.290, + "args": { + "External id": 227605,"Sequence number": 2757795, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406511.682, "dur": 5.302, + "args": { + "External id": 227606,"Sequence number": 2757795, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6405 + } + }, + { + "ph": "s", "id": 161, "pid": 4183442, "tid": 4183442, "ts": 667115406511.682, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115406518.162, "dur": 45.259, + "args": { + "External id": 227607,"Sequence number": 2757796, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6406 + } + }, + { + "ph": "s", "id": 160, "pid": 4183442, "tid": 4183442, "ts": 667115406518.162, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115406565.561, "dur": 4.489, + "args": { + "External id": 227608,"Sequence number": 2757797, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6407 + } + }, + { + "ph": "s", "id": 159, "pid": 4183442, "tid": 4183442, "ts": 667115406565.561, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406593.728, "dur": 3.926, + "args": { + "External id": 227609,"Sequence number": 2757798, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406594.724, "dur": 2.811, + "args": { + "External id": 227610,"Sequence number": 2757798, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6409 + } + }, + { + "ph": "s", "id": 158, "pid": 4183442, "tid": 4183442, "ts": 667115406594.724, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406607.539, "dur": 5.654, + "args": { + "External id": 227611,"Sequence number": 2757799, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406608.793, "dur": 4.253, + "args": { + "External id": 227612,"Sequence number": 2757799, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6411 + } + }, + { + "ph": "s", "id": 157, "pid": 4183442, "tid": 4183442, "ts": 667115406608.793, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115406617.800, "dur": 2.899, + "args": { + "External id": 227613,"Sequence number": 2757800, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115406618.740, "dur": 1.817, + "args": { + "External id": 227614,"Sequence number": 2757800, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6413 + } + }, + { + "ph": "s", "id": 156, "pid": 4183442, "tid": 4183442, "ts": 667115406618.740, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115406694.022, "dur": 190.717, + "args": { + "External id": 227615,"Sequence number": 2757801, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6414 + } + }, + { + "ph": "s", "id": 155, "pid": 4183442, "tid": 4183442, "ts": 667115406694.022, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115406719.379, "dur": 10.219, + "args": { + "External id": 227616,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406722.416, "dur": 6.552, + "args": { + "External id": 227617,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115406901.363, "dur": 106.560, + "args": { + "External id": 227618,"Sequence number": 2757802, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6417 + } + }, + { + "ph": "s", "id": 154, "pid": 4183442, "tid": 4183442, "ts": 667115406901.363, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115406915.399, "dur": 7.624, + "args": { + "External id": 227619,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115406917.446, "dur": 5.118, + "args": { + "External id": 227620,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183442, "tid": 4183442, + "ts": 667115407039.175, "dur": 186.992, + "args": { + "External id": 227621,"Sequence number": 2757803, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6420 + } + }, + { + "ph": "s", "id": 153, "pid": 4183442, "tid": 4183442, "ts": 667115407039.175, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115407069.696, "dur": 128.031, + "args": { + "External id": 227622,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115407120.921, "dur": 7.172, + "args": { + "External id": 227623,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115407123.088, "dur": 4.419, + "args": { + "External id": 227624,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407130.778, "dur": 4.130, + "args": { + "External id": 227625,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407136.277, "dur": 1.720, + "args": { + "External id": 227626,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407140.603, "dur": 5.211, + "args": { + "External id": 227627,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 4183442, + "ts": 667115407211.376, "dur": 5.614, + "args": { + "External id": 227628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407231.744, "dur": 6.254, + "args": { + "External id": 227629,"Sequence number": 2757804, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407233.508, "dur": 4.302, + "args": { + "External id": 227630,"Sequence number": 2757804, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6429 + } + }, + { + "ph": "s", "id": 152, "pid": 4183442, "tid": 4183442, "ts": 667115407233.508, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115407250.670, "dur": 109.702, + "args": { + "External id": 227631,"Sequence number": 2757805, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115407252.232, "dur": 8.964, + "args": { + "External id": 227632,"Sequence number": 2757805, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6431 + } + }, + { + "ph": "s", "id": 151, "pid": 4183442, "tid": 4183442, "ts": 667115407252.232, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115407254.974, "dur": 5.068, + "args": { + "External id": 227633,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115407258.039, "dur": 1.712, + "args": { + "External id": 227634,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115407262.589, "dur": 97.428, + "args": { + "External id": 227635,"Sequence number": 2757806, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407264.811, "dur": 5.588, + "args": { + "External id": 227636,"Sequence number": 2757806, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407266.179, "dur": 4.077, + "args": { + "External id": 227637,"Sequence number": 2757806, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6436 + } + }, + { + "ph": "s", "id": 150, "pid": 4183442, "tid": 4183442, "ts": 667115407266.179, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115407271.577, "dur": 81.929, + "args": { + "External id": 227638,"Sequence number": 2757807, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6437 + } + }, + { + "ph": "s", "id": 149, "pid": 4183442, "tid": 4183442, "ts": 667115407271.577, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115407356.073, "dur": 3.236, + "args": { + "External id": 227639,"Sequence number": 2757808, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6438 + } + }, + { + "ph": "s", "id": 148, "pid": 4183442, "tid": 4183442, "ts": 667115407356.073, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115407393.643, "dur": 244.777, + "args": { + "External id": 227640,"Sequence number": 2757809, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6439 + } + }, + { + "ph": "s", "id": 147, "pid": 4183442, "tid": 4183442, "ts": 667115407393.643, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407411.689, "dur": 2.807, + "args": { + "External id": 227641,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407412.989, "dur": 1.374, + "args": { + "External id": 227642,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183442, "tid": 4183442, + "ts": 667115407420.657, "dur": 4.036, + "args": { + "External id": 227643,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407422.058, "dur": 2.522, + "args": { + "External id": 227644,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407423.149, "dur": 1.318, + "args": { + "External id": 227645,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115407432.189, "dur": 7.610, + "args": { + "External id": 227646,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115407434.970, "dur": 4.378, + "args": { + "External id": 227647,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407446.008, "dur": 3.556, + "args": { + "External id": 227648,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407453.124, "dur": 4.618, + "args": { + "External id": 227649,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407613.145, "dur": 6.731, + "args": { + "External id": 227650,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407614.540, "dur": 5.036, + "args": { + "External id": 227651,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407623.071, "dur": 2.574, + "args": { + "External id": 227652,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407624.236, "dur": 1.307, + "args": { + "External id": 227653,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115407697.843, "dur": 121.154, + "args": { + "External id": 227654,"Sequence number": 2757810, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115407699.275, "dur": 10.512, + "args": { + "External id": 227655,"Sequence number": 2757810, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6454 + } + }, + { + "ph": "s", "id": 146, "pid": 4183442, "tid": 4183442, "ts": 667115407699.275, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115407703.232, "dur": 5.006, + "args": { + "External id": 227656,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115407705.919, "dur": 1.905, + "args": { + "External id": 227657,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115407710.904, "dur": 107.739, + "args": { + "External id": 227658,"Sequence number": 2757811, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407712.949, "dur": 6.010, + "args": { + "External id": 227659,"Sequence number": 2757811, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407714.119, "dur": 4.710, + "args": { + "External id": 227660,"Sequence number": 2757811, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6459 + } + }, + { + "ph": "s", "id": 145, "pid": 4183442, "tid": 4183442, "ts": 667115407714.119, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115407719.826, "dur": 92.941, + "args": { + "External id": 227661,"Sequence number": 2757812, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6460 + } + }, + { + "ph": "s", "id": 144, "pid": 4183442, "tid": 4183442, "ts": 667115407719.826, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115407814.806, "dur": 3.091, + "args": { + "External id": 227662,"Sequence number": 2757813, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6461 + } + }, + { + "ph": "s", "id": 143, "pid": 4183442, "tid": 4183442, "ts": 667115407814.806, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115407828.642, "dur": 70.919, + "args": { + "External id": 227663,"Sequence number": 2757814, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115407829.684, "dur": 8.858, + "args": { + "External id": 227664,"Sequence number": 2757814, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6463 + } + }, + { + "ph": "s", "id": 142, "pid": 4183442, "tid": 4183442, "ts": 667115407829.684, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115407831.895, "dur": 5.446, + "args": { + "External id": 227665,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115407836.106, "dur": 1.097, + "args": { + "External id": 227666,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115407839.171, "dur": 60.120, + "args": { + "External id": 227667,"Sequence number": 2757815, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115407840.719, "dur": 4.970, + "args": { + "External id": 227668,"Sequence number": 2757815, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115407841.599, "dur": 3.931, + "args": { + "External id": 227669,"Sequence number": 2757815, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6468 + } + }, + { + "ph": "s", "id": 141, "pid": 4183442, "tid": 4183442, "ts": 667115407841.599, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115407846.418, "dur": 45.926, + "args": { + "External id": 227670,"Sequence number": 2757816, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6469 + } + }, + { + "ph": "s", "id": 140, "pid": 4183442, "tid": 4183442, "ts": 667115407846.418, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115407894.542, "dur": 4.431, + "args": { + "External id": 227671,"Sequence number": 2757817, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6470 + } + }, + { + "ph": "s", "id": 139, "pid": 4183442, "tid": 4183442, "ts": 667115407894.542, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115407923.433, "dur": 154.304, + "args": { + "External id": 227672,"Sequence number": 2757818, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6471 + } + }, + { + "ph": "s", "id": 138, "pid": 4183442, "tid": 4183442, "ts": 667115407923.433, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115407966.826, "dur": 4.695, + "args": { + "External id": 227673,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115408006.267, "dur": 56.449, + "args": { + "External id": 227674,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115408006.946, "dur": 5.543, + "args": { + "External id": 227675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115408008.439, "dur": 3.088, + "args": { + "External id": 227676,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408010.215, "dur": 0.993, + "args": { + "External id": 227677,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115408013.175, "dur": 49.208, + "args": { + "External id": 227678,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408015.412, "dur": 3.068, + "args": { + "External id": 227679,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408016.797, "dur": 1.558, + "args": { + "External id": 227680,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115408019.299, "dur": 39.183, + "args": { + "External id": 227681,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115408060.548, "dur": 1.309, + "args": { + "External id": 227682,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115408088.276, "dur": 26.386, + "args": { + "External id": 227683,"Sequence number": 2757819, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6482 + } + }, + { + "ph": "s", "id": 137, "pid": 4183442, "tid": 4183442, "ts": 667115408088.276, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115408149.155, "dur": 179.113, + "args": { + "External id": 227684,"Sequence number": 2757820, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6483 + } + }, + { + "ph": "s", "id": 136, "pid": 4183442, "tid": 4183442, "ts": 667115408149.155, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408170.468, "dur": 3.476, + "args": { + "External id": 227685,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408171.721, "dur": 2.037, + "args": { + "External id": 227686,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115408181.232, "dur": 7.215, + "args": { + "External id": 227687,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408183.964, "dur": 4.096, + "args": { + "External id": 227688,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115408193.931, "dur": 3.448, + "args": { + "External id": 227689,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408312.930, "dur": 5.581, + "args": { + "External id": 227690,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408316.548, "dur": 1.728, + "args": { + "External id": 227691,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115408346.291, "dur": 79.225, + "args": { + "External id": 227692,"Sequence number": 2757821, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115408347.590, "dur": 6.880, + "args": { + "External id": 227693,"Sequence number": 2757821, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6492 + } + }, + { + "ph": "s", "id": 135, "pid": 4183442, "tid": 4183442, "ts": 667115408347.590, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115408350.090, "dur": 3.092, + "args": { + "External id": 227694,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408351.883, "dur": 1.088, + "args": { + "External id": 227695,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115408355.424, "dur": 69.848, + "args": { + "External id": 227696,"Sequence number": 2757822, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408357.188, "dur": 4.658, + "args": { + "External id": 227697,"Sequence number": 2757822, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408358.335, "dur": 3.331, + "args": { + "External id": 227698,"Sequence number": 2757822, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6497 + } + }, + { + "ph": "s", "id": 134, "pid": 4183442, "tid": 4183442, "ts": 667115408358.335, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115408362.738, "dur": 57.372, + "args": { + "External id": 227699,"Sequence number": 2757823, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6498 + } + }, + { + "ph": "s", "id": 133, "pid": 4183442, "tid": 4183442, "ts": 667115408362.738, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115408422.049, "dur": 2.727, + "args": { + "External id": 227700,"Sequence number": 2757824, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6499 + } + }, + { + "ph": "s", "id": 132, "pid": 4183442, "tid": 4183442, "ts": 667115408422.049, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115408433.703, "dur": 86.778, + "args": { + "External id": 227701,"Sequence number": 2757825, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115408434.404, "dur": 8.714, + "args": { + "External id": 227702,"Sequence number": 2757825, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6501 + } + }, + { + "ph": "s", "id": 131, "pid": 4183442, "tid": 4183442, "ts": 667115408434.404, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115408438.820, "dur": 3.124, + "args": { + "External id": 227703,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408440.701, "dur": 1.102, + "args": { + "External id": 227704,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115408443.693, "dur": 76.525, + "args": { + "External id": 227705,"Sequence number": 2757826, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408445.251, "dur": 6.675, + "args": { + "External id": 227706,"Sequence number": 2757826, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408446.457, "dur": 5.306, + "args": { + "External id": 227707,"Sequence number": 2757826, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6506 + } + }, + { + "ph": "s", "id": 130, "pid": 4183442, "tid": 4183442, "ts": 667115408446.457, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115408452.764, "dur": 57.908, + "args": { + "External id": 227708,"Sequence number": 2757827, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6507 + } + }, + { + "ph": "s", "id": 129, "pid": 4183442, "tid": 4183442, "ts": 667115408452.764, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115408514.220, "dur": 5.454, + "args": { + "External id": 227709,"Sequence number": 2757828, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6508 + } + }, + { + "ph": "s", "id": 128, "pid": 4183442, "tid": 4183442, "ts": 667115408514.220, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115408530.111, "dur": 62.292, + "args": { + "External id": 227710,"Sequence number": 2757829, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115408530.984, "dur": 6.813, + "args": { + "External id": 227711,"Sequence number": 2757829, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6510 + } + }, + { + "ph": "s", "id": 127, "pid": 4183442, "tid": 4183442, "ts": 667115408530.984, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115408533.372, "dur": 3.285, + "args": { + "External id": 227712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408535.647, "dur": 0.846, + "args": { + "External id": 227713,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115408538.799, "dur": 53.349, + "args": { + "External id": 227714,"Sequence number": 2757830, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408540.151, "dur": 5.022, + "args": { + "External id": 227715,"Sequence number": 2757830, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408541.281, "dur": 3.770, + "args": { + "External id": 227716,"Sequence number": 2757830, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6515 + } + }, + { + "ph": "s", "id": 126, "pid": 4183442, "tid": 4183442, "ts": 667115408541.281, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115408545.679, "dur": 41.874, + "args": { + "External id": 227717,"Sequence number": 2757831, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6516 + } + }, + { + "ph": "s", "id": 125, "pid": 4183442, "tid": 4183442, "ts": 667115408545.679, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115408589.675, "dur": 2.067, + "args": { + "External id": 227718,"Sequence number": 2757832, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6517 + } + }, + { + "ph": "s", "id": 124, "pid": 4183442, "tid": 4183442, "ts": 667115408589.675, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408609.124, "dur": 4.072, + "args": { + "External id": 227719,"Sequence number": 2757833, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408610.194, "dur": 2.879, + "args": { + "External id": 227720,"Sequence number": 2757833, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6519 + } + }, + { + "ph": "s", "id": 123, "pid": 4183442, "tid": 4183442, "ts": 667115408610.194, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408619.601, "dur": 5.212, + "args": { + "External id": 227721,"Sequence number": 2757834, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408620.594, "dur": 4.073, + "args": { + "External id": 227722,"Sequence number": 2757834, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6521 + } + }, + { + "ph": "s", "id": 122, "pid": 4183442, "tid": 4183442, "ts": 667115408620.594, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115408629.150, "dur": 6.151, + "args": { + "External id": 227723,"Sequence number": 2757835, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115408630.435, "dur": 4.716, + "args": { + "External id": 227724,"Sequence number": 2757835, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6523 + } + }, + { + "ph": "s", "id": 121, "pid": 4183442, "tid": 4183442, "ts": 667115408630.435, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115408699.517, "dur": 159.992, + "args": { + "External id": 227725,"Sequence number": 2757836, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6524 + } + }, + { + "ph": "s", "id": 120, "pid": 4183442, "tid": 4183442, "ts": 667115408699.517, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115408720.722, "dur": 8.946, + "args": { + "External id": 227726,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408723.394, "dur": 5.716, + "args": { + "External id": 227727,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115408873.279, "dur": 104.528, + "args": { + "External id": 227728,"Sequence number": 2757837, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6527 + } + }, + { + "ph": "s", "id": 119, "pid": 4183442, "tid": 4183442, "ts": 667115408873.279, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115408887.093, "dur": 8.226, + "args": { + "External id": 227729,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115408889.573, "dur": 5.367, + "args": { + "External id": 227730,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183442, "tid": 4183442, + "ts": 667115409006.264, "dur": 174.323, + "args": { + "External id": 227731,"Sequence number": 2757838, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6530 + } + }, + { + "ph": "s", "id": 118, "pid": 4183442, "tid": 4183442, "ts": 667115409006.264, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115409032.367, "dur": 123.542, + "args": { + "External id": 227732,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115409081.905, "dur": 7.533, + "args": { + "External id": 227733,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409084.214, "dur": 4.660, + "args": { + "External id": 227734,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409091.828, "dur": 3.969, + "args": { + "External id": 227735,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409097.480, "dur": 1.520, + "args": { + "External id": 227736,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409103.807, "dur": 2.963, + "args": { + "External id": 227737,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 4183442, + "ts": 667115409167.524, "dur": 4.482, + "args": { + "External id": 227738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409185.729, "dur": 6.398, + "args": { + "External id": 227739,"Sequence number": 2757839, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409187.378, "dur": 4.611, + "args": { + "External id": 227740,"Sequence number": 2757839, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6539 + } + }, + { + "ph": "s", "id": 117, "pid": 4183442, "tid": 4183442, "ts": 667115409187.378, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115409205.818, "dur": 109.186, + "args": { + "External id": 227741,"Sequence number": 2757840, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115409207.578, "dur": 9.088, + "args": { + "External id": 227742,"Sequence number": 2757840, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6541 + } + }, + { + "ph": "s", "id": 116, "pid": 4183442, "tid": 4183442, "ts": 667115409207.578, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115409210.884, "dur": 4.609, + "args": { + "External id": 227743,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409213.598, "dur": 1.643, + "args": { + "External id": 227744,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115409218.199, "dur": 96.480, + "args": { + "External id": 227745,"Sequence number": 2757841, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409220.462, "dur": 4.437, + "args": { + "External id": 227746,"Sequence number": 2757841, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409221.702, "dur": 3.049, + "args": { + "External id": 227747,"Sequence number": 2757841, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6546 + } + }, + { + "ph": "s", "id": 115, "pid": 4183442, "tid": 4183442, "ts": 667115409221.702, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115409226.113, "dur": 81.961, + "args": { + "External id": 227748,"Sequence number": 2757842, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6547 + } + }, + { + "ph": "s", "id": 114, "pid": 4183442, "tid": 4183442, "ts": 667115409226.113, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115409310.450, "dur": 3.500, + "args": { + "External id": 227749,"Sequence number": 2757843, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6548 + } + }, + { + "ph": "s", "id": 113, "pid": 4183442, "tid": 4183442, "ts": 667115409310.450, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115409348.928, "dur": 236.312, + "args": { + "External id": 227750,"Sequence number": 2757844, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6549 + } + }, + { + "ph": "s", "id": 112, "pid": 4183442, "tid": 4183442, "ts": 667115409348.928, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409369.196, "dur": 3.003, + "args": { + "External id": 227751,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409370.418, "dur": 1.571, + "args": { + "External id": 227752,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183442, "tid": 4183442, + "ts": 667115409376.367, "dur": 4.185, + "args": { + "External id": 227753,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409378.077, "dur": 2.355, + "args": { + "External id": 227754,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409379.153, "dur": 1.175, + "args": { + "External id": 227755,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115409387.741, "dur": 7.485, + "args": { + "External id": 227756,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409390.143, "dur": 4.782, + "args": { + "External id": 227757,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409402.114, "dur": 3.268, + "args": { + "External id": 227758,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409409.410, "dur": 4.038, + "args": { + "External id": 227759,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409558.841, "dur": 6.929, + "args": { + "External id": 227760,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409562.411, "dur": 2.972, + "args": { + "External id": 227761,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409568.871, "dur": 2.604, + "args": { + "External id": 227762,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409570.307, "dur": 1.043, + "args": { + "External id": 227763,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115409604.912, "dur": 162.551, + "args": { + "External id": 227764,"Sequence number": 2757845, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115409605.952, "dur": 8.855, + "args": { + "External id": 227765,"Sequence number": 2757845, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6564 + } + }, + { + "ph": "s", "id": 111, "pid": 4183442, "tid": 4183442, "ts": 667115409605.952, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115409608.757, "dur": 4.891, + "args": { + "External id": 227766,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409611.374, "dur": 1.954, + "args": { + "External id": 227767,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115409615.741, "dur": 151.427, + "args": { + "External id": 227768,"Sequence number": 2757846, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409617.935, "dur": 6.272, + "args": { + "External id": 227769,"Sequence number": 2757846, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409619.192, "dur": 4.842, + "args": { + "External id": 227770,"Sequence number": 2757846, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6569 + } + }, + { + "ph": "s", "id": 110, "pid": 4183442, "tid": 4183442, "ts": 667115409619.192, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115409625.144, "dur": 114.600, + "args": { + "External id": 227771,"Sequence number": 2757847, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6570 + } + }, + { + "ph": "s", "id": 109, "pid": 4183442, "tid": 4183442, "ts": 667115409625.144, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115409760.307, "dur": 5.977, + "args": { + "External id": 227772,"Sequence number": 2757848, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6571 + } + }, + { + "ph": "s", "id": 108, "pid": 4183442, "tid": 4183442, "ts": 667115409760.307, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115409778.340, "dur": 72.731, + "args": { + "External id": 227773,"Sequence number": 2757849, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115409779.406, "dur": 7.293, + "args": { + "External id": 227774,"Sequence number": 2757849, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6573 + } + }, + { + "ph": "s", "id": 107, "pid": 4183442, "tid": 4183442, "ts": 667115409779.406, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115409781.265, "dur": 4.210, + "args": { + "External id": 227775,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409783.899, "dur": 1.401, + "args": { + "External id": 227776,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115409787.550, "dur": 63.301, + "args": { + "External id": 227777,"Sequence number": 2757850, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409788.816, "dur": 5.643, + "args": { + "External id": 227778,"Sequence number": 2757850, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409789.861, "dur": 4.457, + "args": { + "External id": 227779,"Sequence number": 2757850, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6578 + } + }, + { + "ph": "s", "id": 106, "pid": 4183442, "tid": 4183442, "ts": 667115409789.861, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115409795.030, "dur": 50.901, + "args": { + "External id": 227780,"Sequence number": 2757851, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6579 + } + }, + { + "ph": "s", "id": 105, "pid": 4183442, "tid": 4183442, "ts": 667115409795.030, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115409847.946, "dur": 2.557, + "args": { + "External id": 227781,"Sequence number": 2757852, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6580 + } + }, + { + "ph": "s", "id": 104, "pid": 4183442, "tid": 4183442, "ts": 667115409847.946, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115409874.756, "dur": 151.214, + "args": { + "External id": 227782,"Sequence number": 2757853, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6581 + } + }, + { + "ph": "s", "id": 103, "pid": 4183442, "tid": 4183442, "ts": 667115409874.756, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115409913.154, "dur": 5.193, + "args": { + "External id": 227783,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115409948.466, "dur": 62.985, + "args": { + "External id": 227784,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115409949.217, "dur": 7.709, + "args": { + "External id": 227785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115409950.483, "dur": 5.228, + "args": { + "External id": 227786,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115409954.733, "dur": 0.776, + "args": { + "External id": 227787,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115409957.845, "dur": 53.364, + "args": { + "External id": 227788,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115409959.818, "dur": 2.899, + "args": { + "External id": 227789,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115409961.225, "dur": 1.332, + "args": { + "External id": 227790,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115409963.816, "dur": 43.487, + "args": { + "External id": 227791,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115410009.377, "dur": 1.333, + "args": { + "External id": 227792,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115410034.916, "dur": 25.424, + "args": { + "External id": 227793,"Sequence number": 2757854, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6592 + } + }, + { + "ph": "s", "id": 102, "pid": 4183442, "tid": 4183442, "ts": 667115410034.916, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115410094.788, "dur": 183.482, + "args": { + "External id": 227794,"Sequence number": 2757855, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6593 + } + }, + { + "ph": "s", "id": 101, "pid": 4183442, "tid": 4183442, "ts": 667115410094.788, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410113.407, "dur": 3.410, + "args": { + "External id": 227795,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410114.388, "dur": 2.238, + "args": { + "External id": 227796,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115410125.219, "dur": 8.219, + "args": { + "External id": 227797,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410128.366, "dur": 4.608, + "args": { + "External id": 227798,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115410139.788, "dur": 3.837, + "args": { + "External id": 227799,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410263.371, "dur": 2.987, + "args": { + "External id": 227800,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410264.319, "dur": 1.842, + "args": { + "External id": 227801,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115410299.513, "dur": 86.801, + "args": { + "External id": 227802,"Sequence number": 2757856, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115410300.574, "dur": 8.740, + "args": { + "External id": 227803,"Sequence number": 2757856, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6602 + } + }, + { + "ph": "s", "id": 100, "pid": 4183442, "tid": 4183442, "ts": 667115410300.574, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115410303.193, "dur": 4.721, + "args": { + "External id": 227804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410305.734, "dur": 1.963, + "args": { + "External id": 227805,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115410310.444, "dur": 75.626, + "args": { + "External id": 227806,"Sequence number": 2757857, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410312.456, "dur": 4.087, + "args": { + "External id": 227807,"Sequence number": 2757857, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410313.742, "dur": 2.637, + "args": { + "External id": 227808,"Sequence number": 2757857, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6607 + } + }, + { + "ph": "s", "id": 99, "pid": 4183442, "tid": 4183442, "ts": 667115410313.742, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115410317.620, "dur": 58.386, + "args": { + "External id": 227809,"Sequence number": 2757858, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6608 + } + }, + { + "ph": "s", "id": 98, "pid": 4183442, "tid": 4183442, "ts": 667115410317.620, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115410378.108, "dur": 7.252, + "args": { + "External id": 227810,"Sequence number": 2757859, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6609 + } + }, + { + "ph": "s", "id": 97, "pid": 4183442, "tid": 4183442, "ts": 667115410378.108, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115410394.778, "dur": 62.921, + "args": { + "External id": 227811,"Sequence number": 2757860, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115410395.656, "dur": 5.690, + "args": { + "External id": 227812,"Sequence number": 2757860, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6611 + } + }, + { + "ph": "s", "id": 96, "pid": 4183442, "tid": 4183442, "ts": 667115410395.656, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115410397.162, "dur": 2.964, + "args": { + "External id": 227813,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410399.065, "dur": 0.856, + "args": { + "External id": 227814,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115410402.526, "dur": 54.976, + "args": { + "External id": 227815,"Sequence number": 2757861, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410404.212, "dur": 3.468, + "args": { + "External id": 227816,"Sequence number": 2757861, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410405.159, "dur": 2.372, + "args": { + "External id": 227817,"Sequence number": 2757861, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6616 + } + }, + { + "ph": "s", "id": 95, "pid": 4183442, "tid": 4183442, "ts": 667115410405.159, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115410408.445, "dur": 44.838, + "args": { + "External id": 227818,"Sequence number": 2757862, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6617 + } + }, + { + "ph": "s", "id": 94, "pid": 4183442, "tid": 4183442, "ts": 667115410408.445, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115410454.908, "dur": 2.311, + "args": { + "External id": 227819,"Sequence number": 2757863, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6618 + } + }, + { + "ph": "s", "id": 93, "pid": 4183442, "tid": 4183442, "ts": 667115410454.908, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115410464.015, "dur": 84.186, + "args": { + "External id": 227820,"Sequence number": 2757864, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115410464.641, "dur": 5.694, + "args": { + "External id": 227821,"Sequence number": 2757864, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6620 + } + }, + { + "ph": "s", "id": 92, "pid": 4183442, "tid": 4183442, "ts": 667115410464.641, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115410466.197, "dur": 2.980, + "args": { + "External id": 227822,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410468.023, "dur": 1.020, + "args": { + "External id": 227823,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115410471.070, "dur": 76.853, + "args": { + "External id": 227824,"Sequence number": 2757865, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410472.708, "dur": 4.564, + "args": { + "External id": 227825,"Sequence number": 2757865, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410473.715, "dur": 3.428, + "args": { + "External id": 227826,"Sequence number": 2757865, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6625 + } + }, + { + "ph": "s", "id": 91, "pid": 4183442, "tid": 4183442, "ts": 667115410473.715, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115410477.926, "dur": 63.026, + "args": { + "External id": 227827,"Sequence number": 2757866, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6626 + } + }, + { + "ph": "s", "id": 90, "pid": 4183442, "tid": 4183442, "ts": 667115410477.926, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115410544.321, "dur": 3.180, + "args": { + "External id": 227828,"Sequence number": 2757867, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6627 + } + }, + { + "ph": "s", "id": 89, "pid": 4183442, "tid": 4183442, "ts": 667115410544.321, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410565.485, "dur": 5.022, + "args": { + "External id": 227829,"Sequence number": 2757868, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410566.622, "dur": 3.726, + "args": { + "External id": 227830,"Sequence number": 2757868, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6629 + } + }, + { + "ph": "s", "id": 88, "pid": 4183442, "tid": 4183442, "ts": 667115410566.622, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410577.532, "dur": 5.813, + "args": { + "External id": 227831,"Sequence number": 2757869, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410578.696, "dur": 4.489, + "args": { + "External id": 227832,"Sequence number": 2757869, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6631 + } + }, + { + "ph": "s", "id": 87, "pid": 4183442, "tid": 4183442, "ts": 667115410578.696, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115410587.565, "dur": 3.249, + "args": { + "External id": 227833,"Sequence number": 2757870, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115410588.749, "dur": 1.929, + "args": { + "External id": 227834,"Sequence number": 2757870, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6633 + } + }, + { + "ph": "s", "id": 86, "pid": 4183442, "tid": 4183442, "ts": 667115410588.749, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115410620.735, "dur": 200.431, + "args": { + "External id": 227835,"Sequence number": 2757871, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6634 + } + }, + { + "ph": "s", "id": 85, "pid": 4183442, "tid": 4183442, "ts": 667115410620.735, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115410642.055, "dur": 44.452, + "args": { + "External id": 227836,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410645.091, "dur": 40.348, + "args": { + "External id": 227837,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115410835.023, "dur": 110.772, + "args": { + "External id": 227838,"Sequence number": 2757872, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6637 + } + }, + { + "ph": "s", "id": 84, "pid": 4183442, "tid": 4183442, "ts": 667115410835.023, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115410849.541, "dur": 9.016, + "args": { + "External id": 227839,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115410852.051, "dur": 5.952, + "args": { + "External id": 227840,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183442, "tid": 4183442, + "ts": 667115411000.890, "dur": 180.338, + "args": { + "External id": 227841,"Sequence number": 2757873, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6640 + } + }, + { + "ph": "s", "id": 83, "pid": 4183442, "tid": 4183442, "ts": 667115411000.890, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115411028.602, "dur": 127.598, + "args": { + "External id": 227842,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115411076.968, "dur": 9.032, + "args": { + "External id": 227843,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411079.307, "dur": 6.232, + "args": { + "External id": 227844,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411090.693, "dur": 4.607, + "args": { + "External id": 227845,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411096.908, "dur": 1.393, + "args": { + "External id": 227846,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411100.812, "dur": 3.446, + "args": { + "External id": 227847,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 4183442, + "ts": 667115411167.146, "dur": 4.609, + "args": { + "External id": 227848,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411186.294, "dur": 5.287, + "args": { + "External id": 227849,"Sequence number": 2757874, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411187.323, "dur": 4.127, + "args": { + "External id": 227850,"Sequence number": 2757874, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6649 + } + }, + { + "ph": "s", "id": 82, "pid": 4183442, "tid": 4183442, "ts": 667115411187.323, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115411204.728, "dur": 112.101, + "args": { + "External id": 227851,"Sequence number": 2757875, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115411206.252, "dur": 11.156, + "args": { + "External id": 227852,"Sequence number": 2757875, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6651 + } + }, + { + "ph": "s", "id": 81, "pid": 4183442, "tid": 4183442, "ts": 667115411206.252, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115411211.692, "dur": 4.365, + "args": { + "External id": 227853,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411214.285, "dur": 1.478, + "args": { + "External id": 227854,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115411219.052, "dur": 97.520, + "args": { + "External id": 227855,"Sequence number": 2757876, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411221.101, "dur": 3.869, + "args": { + "External id": 227856,"Sequence number": 2757876, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411222.361, "dur": 2.463, + "args": { + "External id": 227857,"Sequence number": 2757876, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6656 + } + }, + { + "ph": "s", "id": 80, "pid": 4183442, "tid": 4183442, "ts": 667115411222.361, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115411226.466, "dur": 81.450, + "args": { + "External id": 227858,"Sequence number": 2757877, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6657 + } + }, + { + "ph": "s", "id": 79, "pid": 4183442, "tid": 4183442, "ts": 667115411226.466, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115411309.885, "dur": 5.971, + "args": { + "External id": 227859,"Sequence number": 2757878, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6658 + } + }, + { + "ph": "s", "id": 78, "pid": 4183442, "tid": 4183442, "ts": 667115411309.885, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115411349.365, "dur": 224.432, + "args": { + "External id": 227860,"Sequence number": 2757879, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6659 + } + }, + { + "ph": "s", "id": 77, "pid": 4183442, "tid": 4183442, "ts": 667115411349.365, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411366.541, "dur": 3.140, + "args": { + "External id": 227861,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411367.758, "dur": 1.731, + "args": { + "External id": 227862,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183442, "tid": 4183442, + "ts": 667115411373.712, "dur": 3.360, + "args": { + "External id": 227863,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411374.769, "dur": 2.193, + "args": { + "External id": 227864,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411375.833, "dur": 1.020, + "args": { + "External id": 227865,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115411384.222, "dur": 7.079, + "args": { + "External id": 227866,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411386.512, "dur": 4.439, + "args": { + "External id": 227867,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411397.769, "dur": 3.309, + "args": { + "External id": 227868,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411404.664, "dur": 3.534, + "args": { + "External id": 227869,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411548.897, "dur": 4.267, + "args": { + "External id": 227870,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411550.472, "dur": 2.400, + "args": { + "External id": 227871,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411556.178, "dur": 2.666, + "args": { + "External id": 227872,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411557.557, "dur": 1.174, + "args": { + "External id": 227873,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115411590.205, "dur": 135.914, + "args": { + "External id": 227874,"Sequence number": 2757880, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115411591.292, "dur": 8.383, + "args": { + "External id": 227875,"Sequence number": 2757880, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6674 + } + }, + { + "ph": "s", "id": 76, "pid": 4183442, "tid": 4183442, "ts": 667115411591.292, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115411594.141, "dur": 4.186, + "args": { + "External id": 227876,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411596.410, "dur": 1.695, + "args": { + "External id": 227877,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115411600.795, "dur": 124.933, + "args": { + "External id": 227878,"Sequence number": 2757881, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411603.166, "dur": 4.368, + "args": { + "External id": 227879,"Sequence number": 2757881, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411604.659, "dur": 2.742, + "args": { + "External id": 227880,"Sequence number": 2757881, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6679 + } + }, + { + "ph": "s", "id": 75, "pid": 4183442, "tid": 4183442, "ts": 667115411604.659, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115411608.319, "dur": 107.484, + "args": { + "External id": 227881,"Sequence number": 2757882, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6680 + } + }, + { + "ph": "s", "id": 74, "pid": 4183442, "tid": 4183442, "ts": 667115411608.319, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115411719.710, "dur": 5.282, + "args": { + "External id": 227882,"Sequence number": 2757883, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6681 + } + }, + { + "ph": "s", "id": 73, "pid": 4183442, "tid": 4183442, "ts": 667115411719.710, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115411736.343, "dur": 74.243, + "args": { + "External id": 227883,"Sequence number": 2757884, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115411737.004, "dur": 7.551, + "args": { + "External id": 227884,"Sequence number": 2757884, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6683 + } + }, + { + "ph": "s", "id": 72, "pid": 4183442, "tid": 4183442, "ts": 667115411737.004, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115411739.516, "dur": 3.663, + "args": { + "External id": 227885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411741.678, "dur": 1.226, + "args": { + "External id": 227886,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115411745.209, "dur": 65.170, + "args": { + "External id": 227887,"Sequence number": 2757885, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411746.638, "dur": 8.038, + "args": { + "External id": 227888,"Sequence number": 2757885, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411747.782, "dur": 6.725, + "args": { + "External id": 227889,"Sequence number": 2757885, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6688 + } + }, + { + "ph": "s", "id": 71, "pid": 4183442, "tid": 4183442, "ts": 667115411747.782, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115411755.409, "dur": 47.584, + "args": { + "External id": 227890,"Sequence number": 2757886, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6689 + } + }, + { + "ph": "s", "id": 70, "pid": 4183442, "tid": 4183442, "ts": 667115411755.409, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115411805.190, "dur": 4.786, + "args": { + "External id": 227891,"Sequence number": 2757887, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6690 + } + }, + { + "ph": "s", "id": 69, "pid": 4183442, "tid": 4183442, "ts": 667115411805.190, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115411831.421, "dur": 144.237, + "args": { + "External id": 227892,"Sequence number": 2757888, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6691 + } + }, + { + "ph": "s", "id": 68, "pid": 4183442, "tid": 4183442, "ts": 667115411831.421, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115411869.893, "dur": 4.570, + "args": { + "External id": 227893,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115411904.688, "dur": 57.813, + "args": { + "External id": 227894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115411905.518, "dur": 5.244, + "args": { + "External id": 227895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115411906.968, "dur": 2.794, + "args": { + "External id": 227896,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115411908.667, "dur": 0.935, + "args": { + "External id": 227897,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115411911.677, "dur": 50.553, + "args": { + "External id": 227898,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115411913.526, "dur": 2.706, + "args": { + "External id": 227899,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115411914.529, "dur": 1.592, + "args": { + "External id": 227900,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115411917.162, "dur": 41.077, + "args": { + "External id": 227901,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115411960.343, "dur": 1.328, + "args": { + "External id": 227902,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115411984.450, "dur": 25.027, + "args": { + "External id": 227903,"Sequence number": 2757889, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6702 + } + }, + { + "ph": "s", "id": 67, "pid": 4183442, "tid": 4183442, "ts": 667115411984.450, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115412043.056, "dur": 176.068, + "args": { + "External id": 227904,"Sequence number": 2757890, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6703 + } + }, + { + "ph": "s", "id": 66, "pid": 4183442, "tid": 4183442, "ts": 667115412043.056, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412061.982, "dur": 3.196, + "args": { + "External id": 227905,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412063.211, "dur": 1.807, + "args": { + "External id": 227906,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115412073.322, "dur": 7.331, + "args": { + "External id": 227907,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412076.383, "dur": 3.837, + "args": { + "External id": 227908,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115412086.868, "dur": 4.124, + "args": { + "External id": 227909,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412204.091, "dur": 3.357, + "args": { + "External id": 227910,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412205.300, "dur": 1.928, + "args": { + "External id": 227911,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115412239.085, "dur": 82.191, + "args": { + "External id": 227912,"Sequence number": 2757891, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115412239.961, "dur": 7.034, + "args": { + "External id": 227913,"Sequence number": 2757891, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6712 + } + }, + { + "ph": "s", "id": 65, "pid": 4183442, "tid": 4183442, "ts": 667115412239.961, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115412242.135, "dur": 3.593, + "args": { + "External id": 227914,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412244.482, "dur": 1.040, + "args": { + "External id": 227915,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115412248.179, "dur": 72.829, + "args": { + "External id": 227916,"Sequence number": 2757892, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412250.283, "dur": 4.406, + "args": { + "External id": 227917,"Sequence number": 2757892, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412251.559, "dur": 2.998, + "args": { + "External id": 227918,"Sequence number": 2757892, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6717 + } + }, + { + "ph": "s", "id": 64, "pid": 4183442, "tid": 4183442, "ts": 667115412251.559, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115412255.566, "dur": 59.861, + "args": { + "External id": 227919,"Sequence number": 2757893, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6718 + } + }, + { + "ph": "s", "id": 63, "pid": 4183442, "tid": 4183442, "ts": 667115412255.566, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115412317.624, "dur": 2.762, + "args": { + "External id": 227920,"Sequence number": 2757894, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6719 + } + }, + { + "ph": "s", "id": 62, "pid": 4183442, "tid": 4183442, "ts": 667115412317.624, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115412328.881, "dur": 61.642, + "args": { + "External id": 227921,"Sequence number": 2757895, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115412330.051, "dur": 6.492, + "args": { + "External id": 227922,"Sequence number": 2757895, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6721 + } + }, + { + "ph": "s", "id": 61, "pid": 4183442, "tid": 4183442, "ts": 667115412330.051, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115412331.799, "dur": 3.710, + "args": { + "External id": 227923,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412334.235, "dur": 1.120, + "args": { + "External id": 227924,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115412337.163, "dur": 53.146, + "args": { + "External id": 227925,"Sequence number": 2757896, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412338.368, "dur": 3.648, + "args": { + "External id": 227926,"Sequence number": 2757896, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412339.403, "dur": 2.493, + "args": { + "External id": 227927,"Sequence number": 2757896, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6726 + } + }, + { + "ph": "s", "id": 60, "pid": 4183442, "tid": 4183442, "ts": 667115412339.403, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115412342.588, "dur": 40.731, + "args": { + "External id": 227928,"Sequence number": 2757897, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6727 + } + }, + { + "ph": "s", "id": 59, "pid": 4183442, "tid": 4183442, "ts": 667115412342.588, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115412385.221, "dur": 4.684, + "args": { + "External id": 227929,"Sequence number": 2757898, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6728 + } + }, + { + "ph": "s", "id": 58, "pid": 4183442, "tid": 4183442, "ts": 667115412385.221, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115412397.733, "dur": 62.660, + "args": { + "External id": 227930,"Sequence number": 2757899, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115412398.387, "dur": 8.586, + "args": { + "External id": 227931,"Sequence number": 2757899, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6730 + } + }, + { + "ph": "s", "id": 57, "pid": 4183442, "tid": 4183442, "ts": 667115412398.387, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115412400.290, "dur": 5.493, + "args": { + "External id": 227932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412402.110, "dur": 3.490, + "args": { + "External id": 227933,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115412407.629, "dur": 52.527, + "args": { + "External id": 227934,"Sequence number": 2757900, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412408.992, "dur": 4.611, + "args": { + "External id": 227935,"Sequence number": 2757900, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412410.074, "dur": 3.411, + "args": { + "External id": 227936,"Sequence number": 2757900, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6735 + } + }, + { + "ph": "s", "id": 56, "pid": 4183442, "tid": 4183442, "ts": 667115412410.074, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115412414.301, "dur": 38.875, + "args": { + "External id": 227937,"Sequence number": 2757901, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6736 + } + }, + { + "ph": "s", "id": 55, "pid": 4183442, "tid": 4183442, "ts": 667115412414.301, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115412455.286, "dur": 4.515, + "args": { + "External id": 227938,"Sequence number": 2757902, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6737 + } + }, + { + "ph": "s", "id": 54, "pid": 4183442, "tid": 4183442, "ts": 667115412455.286, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412476.048, "dur": 4.226, + "args": { + "External id": 227939,"Sequence number": 2757903, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412477.214, "dur": 2.829, + "args": { + "External id": 227940,"Sequence number": 2757903, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6739 + } + }, + { + "ph": "s", "id": 53, "pid": 4183442, "tid": 4183442, "ts": 667115412477.214, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412486.898, "dur": 22.374, + "args": { + "External id": 227941,"Sequence number": 2757904, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412488.571, "dur": 20.172, + "args": { + "External id": 227942,"Sequence number": 2757904, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6741 + } + }, + { + "ph": "s", "id": 52, "pid": 4183442, "tid": 4183442, "ts": 667115412488.571, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115412516.569, "dur": 3.955, + "args": { + "External id": 227943,"Sequence number": 2757905, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115412517.740, "dur": 2.678, + "args": { + "External id": 227944,"Sequence number": 2757905, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6743 + } + }, + { + "ph": "s", "id": 51, "pid": 4183442, "tid": 4183442, "ts": 667115412517.740, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115412548.599, "dur": 197.694, + "args": { + "External id": 227945,"Sequence number": 2757906, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6744 + } + }, + { + "ph": "s", "id": 50, "pid": 4183442, "tid": 4183442, "ts": 667115412548.599, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115412569.118, "dur": 10.521, + "args": { + "External id": 227946,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412571.564, "dur": 7.627, + "args": { + "External id": 227947,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115412769.116, "dur": 110.610, + "args": { + "External id": 227948,"Sequence number": 2757907, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6747 + } + }, + { + "ph": "s", "id": 49, "pid": 4183442, "tid": 4183442, "ts": 667115412769.116, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115412783.678, "dur": 8.666, + "args": { + "External id": 227949,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412786.548, "dur": 5.397, + "args": { + "External id": 227950,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183442, "tid": 4183442, + "ts": 667115412907.482, "dur": 180.944, + "args": { + "External id": 227951,"Sequence number": 2757908, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6750 + } + }, + { + "ph": "s", "id": 48, "pid": 4183442, "tid": 4183442, "ts": 667115412907.482, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115412936.524, "dur": 126.901, + "args": { + "External id": 227952,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115412985.855, "dur": 7.504, + "args": { + "External id": 227953,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115412988.088, "dur": 4.651, + "args": { + "External id": 227954,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115412996.158, "dur": 4.531, + "args": { + "External id": 227955,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115413002.348, "dur": 1.663, + "args": { + "External id": 227956,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115413006.824, "dur": 5.387, + "args": { + "External id": 227957,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183442, "tid": 4183442, + "ts": 667115413074.586, "dur": 4.404, + "args": { + "External id": 227958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413093.527, "dur": 6.049, + "args": { + "External id": 227959,"Sequence number": 2757909, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413095.073, "dur": 4.340, + "args": { + "External id": 227960,"Sequence number": 2757909, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6759 + } + }, + { + "ph": "s", "id": 47, "pid": 4183442, "tid": 4183442, "ts": 667115413095.073, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115413112.064, "dur": 104.946, + "args": { + "External id": 227961,"Sequence number": 2757910, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115413113.867, "dur": 9.224, + "args": { + "External id": 227962,"Sequence number": 2757910, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6761 + } + }, + { + "ph": "s", "id": 46, "pid": 4183442, "tid": 4183442, "ts": 667115413113.867, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115413117.461, "dur": 4.642, + "args": { + "External id": 227963,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115413120.277, "dur": 1.544, + "args": { + "External id": 227964,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115413125.000, "dur": 91.691, + "args": { + "External id": 227965,"Sequence number": 2757911, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413127.263, "dur": 4.328, + "args": { + "External id": 227966,"Sequence number": 2757911, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413128.919, "dur": 2.533, + "args": { + "External id": 227967,"Sequence number": 2757911, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6766 + } + }, + { + "ph": "s", "id": 45, "pid": 4183442, "tid": 4183442, "ts": 667115413128.919, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115413132.947, "dur": 77.219, + "args": { + "External id": 227968,"Sequence number": 2757912, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6767 + } + }, + { + "ph": "s", "id": 44, "pid": 4183442, "tid": 4183442, "ts": 667115413132.947, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115413212.571, "dur": 3.344, + "args": { + "External id": 227969,"Sequence number": 2757913, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6768 + } + }, + { + "ph": "s", "id": 43, "pid": 4183442, "tid": 4183442, "ts": 667115413212.571, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115413248.874, "dur": 196.343, + "args": { + "External id": 227970,"Sequence number": 2757914, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6769 + } + }, + { + "ph": "s", "id": 42, "pid": 4183442, "tid": 4183442, "ts": 667115413248.874, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413265.920, "dur": 2.540, + "args": { + "External id": 227971,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413266.947, "dur": 1.325, + "args": { + "External id": 227972,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183442, "tid": 4183442, + "ts": 667115413272.891, "dur": 3.982, + "args": { + "External id": 227973,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413274.254, "dur": 2.491, + "args": { + "External id": 227974,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413275.534, "dur": 1.084, + "args": { + "External id": 227975,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115413283.843, "dur": 6.968, + "args": { + "External id": 227976,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115413286.038, "dur": 4.427, + "args": { + "External id": 227977,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115413297.044, "dur": 3.282, + "args": { + "External id": 227978,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115413303.810, "dur": 3.537, + "args": { + "External id": 227979,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413423.823, "dur": 5.716, + "args": { + "External id": 227980,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413425.398, "dur": 3.930, + "args": { + "External id": 227981,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413432.159, "dur": 2.752, + "args": { + "External id": 227982,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413433.687, "dur": 1.118, + "args": { + "External id": 227983,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115413461.036, "dur": 113.409, + "args": { + "External id": 227984,"Sequence number": 2757915, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115413462.079, "dur": 7.189, + "args": { + "External id": 227985,"Sequence number": 2757915, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6784 + } + }, + { + "ph": "s", "id": 41, "pid": 4183442, "tid": 4183442, "ts": 667115413462.079, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115413464.004, "dur": 4.141, + "args": { + "External id": 227986,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115413466.592, "dur": 1.353, + "args": { + "External id": 227987,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115413470.969, "dur": 103.194, + "args": { + "External id": 227988,"Sequence number": 2757916, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413472.722, "dur": 6.015, + "args": { + "External id": 227989,"Sequence number": 2757916, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413473.948, "dur": 4.647, + "args": { + "External id": 227990,"Sequence number": 2757916, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6789 + } + }, + { + "ph": "s", "id": 40, "pid": 4183442, "tid": 4183442, "ts": 667115413473.948, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115413479.610, "dur": 87.402, + "args": { + "External id": 227991,"Sequence number": 2757917, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6790 + } + }, + { + "ph": "s", "id": 39, "pid": 4183442, "tid": 4183442, "ts": 667115413479.610, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115413570.110, "dur": 3.492, + "args": { + "External id": 227992,"Sequence number": 2757918, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6791 + } + }, + { + "ph": "s", "id": 38, "pid": 4183442, "tid": 4183442, "ts": 667115413570.110, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115413583.907, "dur": 107.277, + "args": { + "External id": 227993,"Sequence number": 2757919, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115413585.141, "dur": 12.337, + "args": { + "External id": 227994,"Sequence number": 2757919, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6793 + } + }, + { + "ph": "s", "id": 37, "pid": 4183442, "tid": 4183442, "ts": 667115413585.141, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115413590.129, "dur": 5.827, + "args": { + "External id": 227995,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115413594.589, "dur": 1.234, + "args": { + "External id": 227996,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115413598.556, "dur": 92.275, + "args": { + "External id": 227997,"Sequence number": 2757920, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413599.880, "dur": 5.761, + "args": { + "External id": 227998,"Sequence number": 2757920, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413601.482, "dur": 3.995, + "args": { + "External id": 227999,"Sequence number": 2757920, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6798 + } + }, + { + "ph": "s", "id": 36, "pid": 4183442, "tid": 4183442, "ts": 667115413601.482, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115413606.687, "dur": 42.966, + "args": { + "External id": 228000,"Sequence number": 2757921, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6799 + } + }, + { + "ph": "s", "id": 35, "pid": 4183442, "tid": 4183442, "ts": 667115413606.687, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115413651.392, "dur": 38.487, + "args": { + "External id": 228001,"Sequence number": 2757922, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6800 + } + }, + { + "ph": "s", "id": 34, "pid": 4183442, "tid": 4183442, "ts": 667115413651.392, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115413714.202, "dur": 156.729, + "args": { + "External id": 228002,"Sequence number": 2757923, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6801 + } + }, + { + "ph": "s", "id": 33, "pid": 4183442, "tid": 4183442, "ts": 667115413714.202, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115413754.415, "dur": 6.113, + "args": { + "External id": 228003,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115413794.818, "dur": 61.771, + "args": { + "External id": 228004,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115413795.716, "dur": 5.537, + "args": { + "External id": 228005,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115413797.053, "dur": 3.301, + "args": { + "External id": 228006,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115413799.255, "dur": 0.926, + "args": { + "External id": 228007,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115413802.338, "dur": 53.932, + "args": { + "External id": 228008,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183442, "tid": 4183442, + "ts": 667115413804.334, "dur": 2.524, + "args": { + "External id": 228009,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413805.173, "dur": 1.552, + "args": { + "External id": 228010,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115413807.999, "dur": 44.433, + "args": { + "External id": 228011,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183442, "tid": 4183442, + "ts": 667115413854.392, "dur": 1.166, + "args": { + "External id": 228012,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115413879.766, "dur": 23.630, + "args": { + "External id": 228013,"Sequence number": 2757924, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6812 + } + }, + { + "ph": "s", "id": 32, "pid": 4183442, "tid": 4183442, "ts": 667115413879.766, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183442, "tid": 4183442, + "ts": 667115413921.046, "dur": 38.541, + "args": { + "External id": 228014,"Sequence number": 2757925, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "-2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1]], []], "Input Dims": [[[16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024]], []], "Ev Idx": 6813 + } + }, + { + "ph": "s", "id": 31, "pid": 4183442, "tid": 4183442, "ts": 667115413921.046, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 4183442, "tid": 4183442, + "ts": 667115413929.311, "dur": 25.330, + "args": { + "External id": 228015,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1]], []], "Input Dims": [[[16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024]], []], "Ev Idx": 6814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115413956.625, "dur": 1.558, + "args": { + "External id": 228016,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 4096], []], "Ev Idx": 6815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183442, "tid": 4183442, + "ts": 667115413994.325, "dur": 56.187, + "args": { + "External id": 228017,"Record function id": 0, "Ev Idx": 6816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 2/0", "pid": 4183442, "tid": 4183442, + "ts": 667115414052.026, "dur": 186.094, + "args": { + "External id": 228018,"Record function id": 0, "Ev Idx": 6817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115414086.215, "dur": 143.954, + "args": { + "External id": 228019,"Sequence number": 2757926, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1], [16777216, 4096, 1024, 1]], "Input Dims": [[1024], [16, 4096, 4, 1024]], "Ev Idx": 6818 + } + }, + { + "ph": "s", "id": 30, "pid": 4183442, "tid": 4183442, "ts": 667115414086.215, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183442, "tid": 4183442, + "ts": 667115414154.671, "dur": 38.912, + "args": { + "External id": 228020,"kernel_hash": "c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/2a/c2aznfmnsqecy5jxsdvvxqa2d6egj3rlv42aexfrxxtx2wolgw6i.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 1024], [262144, 1024], [1024], [262144], [], [], [], [], [], [], [], [], []], "Ev Idx": 6819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115414318.548, "dur": 36.366, + "args": { + "External id": 228021,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414321.264, "dur": 4.826, + "args": { + "External id": 228022,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414328.534, "dur": 26.046, + "args": { + "External id": 228023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414332.063, "dur": 21.986, + "args": { + "External id": 228024,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115414358.942, "dur": 20.245, + "args": { + "External id": 228025,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414360.249, "dur": 3.565, + "args": { + "External id": 228026,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414364.636, "dur": 14.319, + "args": { + "External id": 228027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414365.523, "dur": 13.091, + "args": { + "External id": 228028,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115414382.035, "dur": 16.414, + "args": { + "External id": 228029,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414383.236, "dur": 2.675, + "args": { + "External id": 228030,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414387.134, "dur": 11.073, + "args": { + "External id": 228031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414387.694, "dur": 10.135, + "args": { + "External id": 228032,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115414407.522, "dur": 0.844, + "args": { + "External id": 228033,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 6832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183442, "tid": 4183442, + "ts": 667115414416.013, "dur": 8.639, + "args": { + "External id": 228034,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "5", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 6833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414421.581, "dur": 1.727, + "args": { + "External id": 228035,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 6834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414430.641, "dur": 7.247, + "args": { + "External id": 228036,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414434.618, "dur": 1.700, + "args": { + "External id": 228037,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414439.453, "dur": 4.014, + "args": { + "External id": 228038,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414441.510, "dur": 1.083, + "args": { + "External id": 228039,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414444.875, "dur": 3.936, + "args": { + "External id": 228040,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414447.472, "dur": 0.836, + "args": { + "External id": 228041,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414451.790, "dur": 3.183, + "args": { + "External id": 228042,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 6841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414453.682, "dur": 0.742, + "args": { + "External id": 228043,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 6842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414456.244, "dur": 3.945, + "args": { + "External id": 228044,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 6843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414458.177, "dur": 0.977, + "args": { + "External id": 228045,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 6844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414461.419, "dur": 3.045, + "args": { + "External id": 228046,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4096, 4], [], [], [], []], "Ev Idx": 6845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414463.297, "dur": 0.639, + "args": { + "External id": 228047,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 6846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115414469.247, "dur": 5.274, + "args": { + "External id": 228048,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4096, 4], [], []], "Ev Idx": 6847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414472.607, "dur": 1.248, + "args": { + "External id": 228049,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 6848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414478.327, "dur": 3.893, + "args": { + "External id": 228050,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 6849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414480.662, "dur": 1.007, + "args": { + "External id": 228051,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 6850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115414485.716, "dur": 29.108, + "args": { + "External id": 228052,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 6851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414511.860, "dur": 1.336, + "args": { + "External id": 228053,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 6852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414516.481, "dur": 4.102, + "args": { + "External id": 228054,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 6853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414519.159, "dur": 0.782, + "args": { + "External id": 228055,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 6854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414524.647, "dur": 6.586, + "args": { + "External id": 228056,"Sequence number": 2757927, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 6855 + } + }, + { + "ph": "s", "id": 29, "pid": 4183442, "tid": 4183442, "ts": 667115414524.647, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414528.594, "dur": 0.993, + "args": { + "External id": 228057,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414532.305, "dur": 5.011, + "args": { + "External id": 228058,"Sequence number": 2757928, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 6857 + } + }, + { + "ph": "s", "id": 28, "pid": 4183442, "tid": 4183442, "ts": 667115414532.305, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414536.032, "dur": 0.527, + "args": { + "External id": 228059,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115414538.580, "dur": 6.371, + "args": { + "External id": 228060,"Sequence number": 2757929, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 6859 + } + }, + { + "ph": "s", "id": 27, "pid": 4183442, "tid": 4183442, "ts": 667115414538.580, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414543.366, "dur": 0.760, + "args": { + "External id": 228061,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115414546.255, "dur": 4.364, + "args": { + "External id": 228062,"Sequence number": 2757930, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 6861 + } + }, + { + "ph": "s", "id": 26, "pid": 4183442, "tid": 4183442, "ts": 667115414546.255, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414548.908, "dur": 0.949, + "args": { + "External id": 228063,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 6862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115414554.783, "dur": 43.718, + "args": { + "External id": 228064,"Sequence number": 2757931, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115414557.575, "dur": 40.692, + "args": { + "External id": 228065,"Sequence number": 2757931, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414560.333, "dur": 9.392, + "args": { + "External id": 228066,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 6865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414562.839, "dur": 6.218, + "args": { + "External id": 228067,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115414571.221, "dur": 26.543, + "args": { + "External id": 228068,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 6867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115414622.176, "dur": 4.574, + "args": { + "External id": 228069,"Sequence number": 2757931, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6868 + } + }, + { + "ph": "s", "id": 25, "pid": 4183442, "tid": 4183442, "ts": 667115414622.176, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115414629.231, "dur": 1.433, + "args": { + "External id": 228070,"Sequence number": 2757932, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115414694.918, "dur": 21527.924, + "args": { + "External id": 228071,"Sequence number": 2757932, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 6870 + } + }, + { + "ph": "s", "id": 24, "pid": 4183442, "tid": 4183442, "ts": 667115414694.918, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115414710.796, "dur": 35.268, + "args": { + "External id": 228072,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115414711.983, "dur": 33.893, + "args": { + "External id": 228073,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414713.875, "dur": 7.785, + "args": { + "External id": 228074,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414716.013, "dur": 4.972, + "args": { + "External id": 228075,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115414722.595, "dur": 22.615, + "args": { + "External id": 228076,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 6875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414762.606, "dur": 33.982, + "args": { + "External id": 228077,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414771.551, "dur": 7.209, + "args": { + "External id": 228078,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414774.367, "dur": 4.082, + "args": { + "External id": 228079,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414779.846, "dur": 16.548, + "args": { + "External id": 228080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 6879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414781.242, "dur": 14.797, + "args": { + "External id": 228081,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414800.319, "dur": 22.244, + "args": { + "External id": 228082,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 6881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115414801.363, "dur": 5.057, + "args": { + "External id": 228083,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 6882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414803.359, "dur": 2.845, + "args": { + "External id": 228084,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414807.248, "dur": 15.101, + "args": { + "External id": 228085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414808.227, "dur": 13.760, + "args": { + "External id": 228086,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 6885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115414827.837, "dur": 17.149, + "args": { + "External id": 228087,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115414829.495, "dur": 2.978, + "args": { + "External id": 228088,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115414833.525, "dur": 11.198, + "args": { + "External id": 228089,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 6888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115414834.545, "dur": 9.853, + "args": { + "External id": 228090,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 4183442, + "ts": 667115414852.744, "dur": 25.154, + "args": { + "External id": 228091,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115414882.629, "dur": 61.389, + "args": { + "External id": 228092,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115414886.439, "dur": 57.098, + "args": { + "External id": 228093,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414893.137, "dur": 1.205, + "args": { + "External id": 228094,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 6893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115414896.111, "dur": 29.157, + "args": { + "External id": 228095,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115414900.137, "dur": 24.932, + "args": { + "External id": 228096,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 6895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115414902.716, "dur": 3.496, + "args": { + "External id": 228097,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115414907.175, "dur": 17.546, + "args": { + "External id": 228098,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 6897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115414948.976, "dur": 15459.271, + "args": { + "External id": 228099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 6898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115414950.972, "dur": 15456.128, + "args": { + "External id": 228100,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 6899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115430419.737, "dur": 7.935, + "args": { + "External id": 228101,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115430424.356, "dur": 1.327, + "args": { + "External id": 228102,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115430433.237, "dur": 123.100, + "args": { + "External id": 228103,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115430435.035, "dur": 7.543, + "args": { + "External id": 228104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115430437.566, "dur": 4.032, + "args": { + "External id": 228105,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115430440.094, "dur": 1.272, + "args": { + "External id": 228106,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115430444.305, "dur": 111.161, + "args": { + "External id": 228107,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115430446.562, "dur": 107.764, + "args": { + "External id": 228108,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115430561.487, "dur": 5.937, + "args": { + "External id": 228109,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115430564.729, "dur": 1.055, + "args": { + "External id": 228110,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115430577.145, "dur": 4.048, + "args": { + "External id": 228111,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 6910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115430591.996, "dur": 8.060, + "args": { + "External id": 228112,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 6911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115430595.145, "dur": 4.613, + "args": { + "External id": 228113,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115430769.206, "dur": 233.811, + "args": { + "External id": 228114,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115430772.866, "dur": 5.424, + "args": { + "External id": 228115,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115430781.384, "dur": 221.111, + "args": { + "External id": 228116,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 6915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115430784.361, "dur": 0.841, + "args": { + "External id": 228117,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115430788.341, "dur": 28.207, + "args": { + "External id": 228118,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115430819.351, "dur": 6.596, + "args": { + "External id": 228119,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 6918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115430824.296, "dur": 1.138, + "args": { + "External id": 228120,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 6919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115430828.014, "dur": 26.046, + "args": { + "External id": 228121,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115430829.698, "dur": 1.229, + "args": { + "External id": 228122,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115430833.349, "dur": 20.414, + "args": { + "External id": 228123,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 6922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115430837.848, "dur": 3.493, + "args": { + "External id": 228124,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115430856.588, "dur": 22.817, + "args": { + "External id": 228125,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115430882.185, "dur": 17.279, + "args": { + "External id": 228126,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115430902.994, "dur": 16.338, + "args": { + "External id": 228127,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 6926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115430922.103, "dur": 15.454, + "args": { + "External id": 228128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115430940.569, "dur": 27.366, + "args": { + "External id": 228129,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 6928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115430945.069, "dur": 2.095, + "args": { + "External id": 228130,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115430949.930, "dur": 0.811, + "args": { + "External id": 228131,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 6930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115430970.882, "dur": 16.488, + "args": { + "External id": 228132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115430989.528, "dur": 12.197, + "args": { + "External id": 228133,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115431010.235, "dur": 2.548, + "args": { + "External id": 228134,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431020.291, "dur": 4.267, + "args": { + "External id": 228135,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431022.809, "dur": 0.962, + "args": { + "External id": 228136,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115431110.967, "dur": 66.445, + "args": { + "External id": 228137,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 6936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431183.017, "dur": 5.254, + "args": { + "External id": 228138,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431185.916, "dur": 1.092, + "args": { + "External id": 228139,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115431190.025, "dur": 30.689, + "args": { + "External id": 228140,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 6939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115431226.194, "dur": 7.274, + "args": { + "External id": 228141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 6940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115431228.395, "dur": 4.307, + "args": { + "External id": 228142,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 6941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431230.799, "dur": 1.690, + "args": { + "External id": 228143,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 6942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115431237.196, "dur": 53.470, + "args": { + "External id": 228144,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115431238.817, "dur": 51.164, + "args": { + "External id": 228145,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115431296.472, "dur": 18.200, + "args": { + "External id": 228146,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 6945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431320.844, "dur": 4.740, + "args": { + "External id": 228147,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431323.631, "dur": 0.911, + "args": { + "External id": 228148,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115431330.513, "dur": 59.648, + "args": { + "External id": 228149,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115431331.699, "dur": 11.554, + "args": { + "External id": 228150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115431332.747, "dur": 9.858, + "args": { + "External id": 228151,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431341.713, "dur": 0.729, + "args": { + "External id": 228152,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115431344.377, "dur": 45.410, + "args": { + "External id": 228153,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115431345.331, "dur": 43.857, + "args": { + "External id": 228154,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431394.473, "dur": 4.548, + "args": { + "External id": 228155,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431396.900, "dur": 0.915, + "args": { + "External id": 228156,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115431404.881, "dur": 2.004, + "args": { + "External id": 228157,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 6956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115431414.980, "dur": 9.128, + "args": { + "External id": 228158,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 6957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115431417.683, "dur": 6.082, + "args": { + "External id": 228159,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115431538.739, "dur": 299.491, + "args": { + "External id": 228160,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115431540.927, "dur": 3.436, + "args": { + "External id": 228161,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115431546.292, "dur": 291.489, + "args": { + "External id": 228162,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 6961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115431548.389, "dur": 0.664, + "args": { + "External id": 228163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115431550.952, "dur": 33.352, + "args": { + "External id": 228164,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115431586.493, "dur": 3.871, + "args": { + "External id": 228165,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 6964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431588.804, "dur": 1.289, + "args": { + "External id": 228166,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 6965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115431591.832, "dur": 31.808, + "args": { + "External id": 228167,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115431593.092, "dur": 1.702, + "args": { + "External id": 228168,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115431596.327, "dur": 27.021, + "args": { + "External id": 228169,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 6968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115431601.853, "dur": 2.840, + "args": { + "External id": 228170,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115431625.631, "dur": 58.742, + "args": { + "External id": 228171,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115431687.326, "dur": 35.009, + "args": { + "External id": 228172,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115431726.093, "dur": 27.298, + "args": { + "External id": 228173,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 6972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115431755.677, "dur": 26.513, + "args": { + "External id": 228174,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115431784.571, "dur": 26.027, + "args": { + "External id": 228175,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 6974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115431786.762, "dur": 2.757, + "args": { + "External id": 228176,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431792.545, "dur": 0.806, + "args": { + "External id": 228177,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 6976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115431812.767, "dur": 11.381, + "args": { + "External id": 228178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115431825.168, "dur": 11.741, + "args": { + "External id": 228179,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115431845.940, "dur": 2.703, + "args": { + "External id": 228180,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431858.801, "dur": 4.565, + "args": { + "External id": 228181,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431861.590, "dur": 0.941, + "args": { + "External id": 228182,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115431939.276, "dur": 50.493, + "args": { + "External id": 228183,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 6982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115431995.025, "dur": 4.864, + "args": { + "External id": 228184,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115431997.871, "dur": 0.921, + "args": { + "External id": 228185,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115432001.836, "dur": 24.976, + "args": { + "External id": 228186,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 6985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115432031.951, "dur": 16.229, + "args": { + "External id": 228187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 6986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115432040.426, "dur": 6.977, + "args": { + "External id": 228188,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 6987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432044.041, "dur": 3.099, + "args": { + "External id": 228189,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 6988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115432051.506, "dur": 45.301, + "args": { + "External id": 228190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115432052.857, "dur": 43.080, + "args": { + "External id": 228191,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115432101.208, "dur": 14.839, + "args": { + "External id": 228192,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 6991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432122.061, "dur": 4.866, + "args": { + "External id": 228193,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432124.855, "dur": 1.155, + "args": { + "External id": 228194,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115432131.045, "dur": 49.459, + "args": { + "External id": 228195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115432132.346, "dur": 4.241, + "args": { + "External id": 228196,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115432133.109, "dur": 2.893, + "args": { + "External id": 228197,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432134.864, "dur": 0.973, + "args": { + "External id": 228198,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115432137.471, "dur": 42.627, + "args": { + "External id": 228199,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115432138.581, "dur": 40.918, + "args": { + "External id": 228200,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432185.122, "dur": 4.148, + "args": { + "External id": 228201,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432187.092, "dur": 1.058, + "args": { + "External id": 228202,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115432195.106, "dur": 1.526, + "args": { + "External id": 228203,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432203.837, "dur": 7.173, + "args": { + "External id": 228204,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432206.790, "dur": 3.940, + "args": { + "External id": 228205,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115432295.353, "dur": 188.657, + "args": { + "External id": 228206,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432297.434, "dur": 2.408, + "args": { + "External id": 228207,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115432303.975, "dur": 179.621, + "args": { + "External id": 228208,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115432305.676, "dur": 0.565, + "args": { + "External id": 228209,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115432307.730, "dur": 21.021, + "args": { + "External id": 228210,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115432330.703, "dur": 6.122, + "args": { + "External id": 228211,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432333.163, "dur": 3.414, + "args": { + "External id": 228212,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115432337.951, "dur": 21.583, + "args": { + "External id": 228213,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432339.244, "dur": 1.762, + "args": { + "External id": 228214,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115432342.306, "dur": 16.850, + "args": { + "External id": 228215,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115432345.195, "dur": 2.581, + "args": { + "External id": 228216,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115432361.183, "dur": 20.331, + "args": { + "External id": 228217,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115432383.107, "dur": 14.682, + "args": { + "External id": 228218,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115432400.279, "dur": 13.523, + "args": { + "External id": 228219,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115432415.514, "dur": 13.212, + "args": { + "External id": 228220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115432431.050, "dur": 21.387, + "args": { + "External id": 228221,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115432433.198, "dur": 1.727, + "args": { + "External id": 228222,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432437.233, "dur": 0.697, + "args": { + "External id": 228223,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115432454.171, "dur": 11.895, + "args": { + "External id": 228224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115432467.251, "dur": 15.222, + "args": { + "External id": 228225,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115432489.857, "dur": 19.532, + "args": { + "External id": 228226,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432521.150, "dur": 4.211, + "args": { + "External id": 228227,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432524.094, "dur": 0.505, + "args": { + "External id": 228228,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115432595.888, "dur": 45.549, + "args": { + "External id": 228229,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432646.416, "dur": 41.527, + "args": { + "External id": 228230,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432649.299, "dur": 36.232, + "args": { + "External id": 228231,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115432690.368, "dur": 27.757, + "args": { + "External id": 228232,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115432724.166, "dur": 6.834, + "args": { + "External id": 228233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115432725.918, "dur": 4.285, + "args": { + "External id": 228234,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432728.574, "dur": 1.182, + "args": { + "External id": 228235,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115432734.312, "dur": 47.610, + "args": { + "External id": 228236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115432735.644, "dur": 45.459, + "args": { + "External id": 228237,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115432785.797, "dur": 14.246, + "args": { + "External id": 228238,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432806.509, "dur": 4.420, + "args": { + "External id": 228239,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432808.996, "dur": 0.977, + "args": { + "External id": 228240,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115432814.853, "dur": 48.733, + "args": { + "External id": 228241,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115432815.982, "dur": 5.046, + "args": { + "External id": 228242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115432817.108, "dur": 3.345, + "args": { + "External id": 228243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432819.167, "dur": 0.959, + "args": { + "External id": 228244,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115432821.833, "dur": 41.402, + "args": { + "External id": 228245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115432822.562, "dur": 40.024, + "args": { + "External id": 228246,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115432867.499, "dur": 4.097, + "args": { + "External id": 228247,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115432869.573, "dur": 0.919, + "args": { + "External id": 228248,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115432877.709, "dur": 1.760, + "args": { + "External id": 228249,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432887.057, "dur": 6.761, + "args": { + "External id": 228250,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432889.302, "dur": 4.258, + "args": { + "External id": 228251,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115432978.659, "dur": 175.479, + "args": { + "External id": 228252,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115432980.941, "dur": 4.380, + "args": { + "External id": 228253,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115432987.054, "dur": 166.600, + "args": { + "External id": 228254,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115432988.515, "dur": 0.336, + "args": { + "External id": 228255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115432990.881, "dur": 19.390, + "args": { + "External id": 228256,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115433011.966, "dur": 5.951, + "args": { + "External id": 228257,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433016.840, "dur": 0.779, + "args": { + "External id": 228258,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115433018.912, "dur": 21.031, + "args": { + "External id": 228259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115433020.446, "dur": 1.708, + "args": { + "External id": 228260,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115433023.556, "dur": 16.042, + "args": { + "External id": 228261,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115433026.074, "dur": 2.710, + "args": { + "External id": 228262,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115433041.503, "dur": 19.148, + "args": { + "External id": 228263,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115433062.256, "dur": 11.579, + "args": { + "External id": 228264,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115433076.727, "dur": 14.284, + "args": { + "External id": 228265,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115433092.701, "dur": 11.298, + "args": { + "External id": 228266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115433106.032, "dur": 22.322, + "args": { + "External id": 228267,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115433107.831, "dur": 1.530, + "args": { + "External id": 228268,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433111.944, "dur": 3.591, + "args": { + "External id": 228269,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115433130.361, "dur": 10.981, + "args": { + "External id": 228270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115433142.640, "dur": 10.137, + "args": { + "External id": 228271,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115433160.831, "dur": 1.578, + "args": { + "External id": 228272,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433170.922, "dur": 3.367, + "args": { + "External id": 228273,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433173.090, "dur": 0.359, + "args": { + "External id": 228274,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115433239.335, "dur": 39.769, + "args": { + "External id": 228275,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433283.561, "dur": 4.739, + "args": { + "External id": 228276,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433286.393, "dur": 0.949, + "args": { + "External id": 228277,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115433289.793, "dur": 22.630, + "args": { + "External id": 228278,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115433316.918, "dur": 6.601, + "args": { + "External id": 228279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115433318.899, "dur": 3.930, + "args": { + "External id": 228280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433321.217, "dur": 1.446, + "args": { + "External id": 228281,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115433326.155, "dur": 44.904, + "args": { + "External id": 228282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115433327.174, "dur": 43.245, + "args": { + "External id": 228283,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115433374.941, "dur": 13.940, + "args": { + "External id": 228284,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433394.311, "dur": 4.505, + "args": { + "External id": 228285,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433397.048, "dur": 0.882, + "args": { + "External id": 228286,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115433402.694, "dur": 47.944, + "args": { + "External id": 228287,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115433403.665, "dur": 3.971, + "args": { + "External id": 228288,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115433404.475, "dur": 2.689, + "args": { + "External id": 228289,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433406.255, "dur": 0.753, + "args": { + "External id": 228290,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115433408.415, "dur": 41.840, + "args": { + "External id": 228291,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115433409.331, "dur": 40.280, + "args": { + "External id": 228292,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433454.881, "dur": 4.037, + "args": { + "External id": 228293,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433456.726, "dur": 1.075, + "args": { + "External id": 228294,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115433464.854, "dur": 1.388, + "args": { + "External id": 228295,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115433473.173, "dur": 6.618, + "args": { + "External id": 228296,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115433475.614, "dur": 3.922, + "args": { + "External id": 228297,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115433584.393, "dur": 233.566, + "args": { + "External id": 228298,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115433589.244, "dur": 3.147, + "args": { + "External id": 228299,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115433594.368, "dur": 222.881, + "args": { + "External id": 228300,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115433596.199, "dur": 0.325, + "args": { + "External id": 228301,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115433597.948, "dur": 22.972, + "args": { + "External id": 228302,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115433622.718, "dur": 4.906, + "args": { + "External id": 228303,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433626.418, "dur": 0.949, + "args": { + "External id": 228304,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115433628.909, "dur": 20.426, + "args": { + "External id": 228305,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115433630.457, "dur": 1.702, + "args": { + "External id": 228306,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115433633.657, "dur": 15.384, + "args": { + "External id": 228307,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115433636.466, "dur": 2.320, + "args": { + "External id": 228308,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115433651.085, "dur": 58.393, + "args": { + "External id": 228309,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115433711.958, "dur": 17.421, + "args": { + "External id": 228310,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115433732.387, "dur": 15.425, + "args": { + "External id": 228311,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115433749.539, "dur": 13.704, + "args": { + "External id": 228312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115433765.361, "dur": 22.875, + "args": { + "External id": 228313,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115433767.710, "dur": 2.034, + "args": { + "External id": 228314,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433772.114, "dur": 0.942, + "args": { + "External id": 228315,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115433790.371, "dur": 13.445, + "args": { + "External id": 228316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115433805.227, "dur": 10.418, + "args": { + "External id": 228317,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115433825.791, "dur": 2.548, + "args": { + "External id": 228318,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433851.138, "dur": 3.938, + "args": { + "External id": 228319,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433853.665, "dur": 0.631, + "args": { + "External id": 228320,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115433926.230, "dur": 50.328, + "args": { + "External id": 228321,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115433981.255, "dur": 4.854, + "args": { + "External id": 228322,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115433983.994, "dur": 1.034, + "args": { + "External id": 228323,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115433987.602, "dur": 24.453, + "args": { + "External id": 228324,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115434016.982, "dur": 9.293, + "args": { + "External id": 228325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115434018.980, "dur": 6.462, + "args": { + "External id": 228326,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434021.602, "dur": 3.604, + "args": { + "External id": 228327,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115434028.866, "dur": 44.678, + "args": { + "External id": 228328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115434030.299, "dur": 42.547, + "args": { + "External id": 228329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115434077.441, "dur": 15.740, + "args": { + "External id": 228330,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434098.760, "dur": 4.602, + "args": { + "External id": 228331,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434101.241, "dur": 1.156, + "args": { + "External id": 228332,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115434107.736, "dur": 48.103, + "args": { + "External id": 228333,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115434108.875, "dur": 4.341, + "args": { + "External id": 228334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115434109.968, "dur": 2.720, + "args": { + "External id": 228335,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434111.587, "dur": 0.954, + "args": { + "External id": 228336,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115434114.492, "dur": 40.988, + "args": { + "External id": 228337,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115434115.081, "dur": 39.663, + "args": { + "External id": 228338,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434159.567, "dur": 3.860, + "args": { + "External id": 228339,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434161.653, "dur": 0.743, + "args": { + "External id": 228340,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115434168.819, "dur": 1.645, + "args": { + "External id": 228341,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434178.479, "dur": 7.173, + "args": { + "External id": 228342,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434181.087, "dur": 4.287, + "args": { + "External id": 228343,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115434264.454, "dur": 329.275, + "args": { + "External id": 228344,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434266.581, "dur": 2.294, + "args": { + "External id": 228345,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115434272.711, "dur": 320.431, + "args": { + "External id": 228346,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115434274.391, "dur": 0.547, + "args": { + "External id": 228347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115434276.628, "dur": 18.483, + "args": { + "External id": 228348,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115434296.672, "dur": 5.469, + "args": { + "External id": 228349,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434298.898, "dur": 2.992, + "args": { + "External id": 228350,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115434303.215, "dur": 53.424, + "args": { + "External id": 228351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434304.420, "dur": 1.375, + "args": { + "External id": 228352,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115434332.718, "dur": 23.657, + "args": { + "External id": 228353,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115434335.909, "dur": 2.478, + "args": { + "External id": 228354,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115434358.163, "dur": 38.945, + "args": { + "External id": 228355,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115434398.795, "dur": 45.339, + "args": { + "External id": 228356,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115434446.988, "dur": 40.081, + "args": { + "External id": 228357,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115434488.838, "dur": 33.827, + "args": { + "External id": 228358,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115434525.719, "dur": 27.637, + "args": { + "External id": 228359,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115434527.956, "dur": 2.175, + "args": { + "External id": 228360,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434532.482, "dur": 0.678, + "args": { + "External id": 228361,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115434555.385, "dur": 21.775, + "args": { + "External id": 228362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115434578.572, "dur": 13.528, + "args": { + "External id": 228363,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115434601.089, "dur": 2.184, + "args": { + "External id": 228364,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434613.102, "dur": 3.805, + "args": { + "External id": 228365,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434615.475, "dur": 0.497, + "args": { + "External id": 228366,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115434720.642, "dur": 52.649, + "args": { + "External id": 228367,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434778.738, "dur": 6.030, + "args": { + "External id": 228368,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434782.490, "dur": 1.009, + "args": { + "External id": 228369,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115434786.528, "dur": 24.508, + "args": { + "External id": 228370,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115434815.885, "dur": 6.386, + "args": { + "External id": 228371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115434817.625, "dur": 3.950, + "args": { + "External id": 228372,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434819.976, "dur": 1.408, + "args": { + "External id": 228373,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115434825.113, "dur": 42.980, + "args": { + "External id": 228374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115434826.258, "dur": 41.258, + "args": { + "External id": 228375,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115434872.313, "dur": 13.700, + "args": { + "External id": 228376,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434891.784, "dur": 4.350, + "args": { + "External id": 228377,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434894.386, "dur": 0.781, + "args": { + "External id": 228378,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115434900.106, "dur": 47.999, + "args": { + "External id": 228379,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115434901.270, "dur": 4.678, + "args": { + "External id": 228380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115434901.981, "dur": 3.362, + "args": { + "External id": 228381,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434903.906, "dur": 1.244, + "args": { + "External id": 228382,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115434906.583, "dur": 41.149, + "args": { + "External id": 228383,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115434907.537, "dur": 39.611, + "args": { + "External id": 228384,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115434952.239, "dur": 3.911, + "args": { + "External id": 228385,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115434954.094, "dur": 0.993, + "args": { + "External id": 228386,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115434962.375, "dur": 1.608, + "args": { + "External id": 228387,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434971.509, "dur": 8.739, + "args": { + "External id": 228388,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115434974.347, "dur": 5.608, + "args": { + "External id": 228389,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115435055.367, "dur": 193.160, + "args": { + "External id": 228390,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435057.376, "dur": 2.326, + "args": { + "External id": 228391,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115435061.518, "dur": 186.534, + "args": { + "External id": 228392,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115435063.000, "dur": 0.453, + "args": { + "External id": 228393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115435065.000, "dur": 24.410, + "args": { + "External id": 228394,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115435091.177, "dur": 3.322, + "args": { + "External id": 228395,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435093.046, "dur": 1.199, + "args": { + "External id": 228396,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115435095.707, "dur": 23.850, + "args": { + "External id": 228397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435097.002, "dur": 1.740, + "args": { + "External id": 228398,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115435099.924, "dur": 19.266, + "args": { + "External id": 228399,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115435104.429, "dur": 2.538, + "args": { + "External id": 228400,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115435121.402, "dur": 20.291, + "args": { + "External id": 228401,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115435143.194, "dur": 13.830, + "args": { + "External id": 228402,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115435165.201, "dur": 14.327, + "args": { + "External id": 228403,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115435180.904, "dur": 14.136, + "args": { + "External id": 228404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115435196.861, "dur": 22.566, + "args": { + "External id": 228405,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115435198.861, "dur": 2.257, + "args": { + "External id": 228406,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435203.521, "dur": 1.824, + "args": { + "External id": 228407,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115435221.231, "dur": 13.717, + "args": { + "External id": 228408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115435235.883, "dur": 10.862, + "args": { + "External id": 228409,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115435254.217, "dur": 1.548, + "args": { + "External id": 228410,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115435263.804, "dur": 3.711, + "args": { + "External id": 228411,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435266.188, "dur": 0.537, + "args": { + "External id": 228412,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115435328.307, "dur": 38.704, + "args": { + "External id": 228413,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115435371.218, "dur": 6.560, + "args": { + "External id": 228414,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435374.016, "dur": 2.721, + "args": { + "External id": 228415,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115435379.412, "dur": 20.750, + "args": { + "External id": 228416,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115435404.366, "dur": 6.078, + "args": { + "External id": 228417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115435405.611, "dur": 4.036, + "args": { + "External id": 228418,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435407.897, "dur": 1.538, + "args": { + "External id": 228419,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115435412.463, "dur": 41.133, + "args": { + "External id": 228420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115435413.767, "dur": 39.012, + "args": { + "External id": 228421,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115435456.973, "dur": 15.335, + "args": { + "External id": 228422,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115435477.599, "dur": 4.565, + "args": { + "External id": 228423,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435480.124, "dur": 1.243, + "args": { + "External id": 228424,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115435485.746, "dur": 70.798, + "args": { + "External id": 228425,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115435486.501, "dur": 20.744, + "args": { + "External id": 228426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115435487.427, "dur": 2.409, + "args": { + "External id": 228427,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435489.069, "dur": 0.617, + "args": { + "External id": 228428,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115435509.250, "dur": 46.847, + "args": { + "External id": 228429,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115435510.017, "dur": 45.517, + "args": { + "External id": 228430,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115435561.768, "dur": 4.998, + "args": { + "External id": 228431,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435564.473, "dur": 1.053, + "args": { + "External id": 228432,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115435572.771, "dur": 1.672, + "args": { + "External id": 228433,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435581.513, "dur": 6.957, + "args": { + "External id": 228434,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435583.721, "dur": 4.469, + "args": { + "External id": 228435,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115435700.641, "dur": 176.650, + "args": { + "External id": 228436,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435703.136, "dur": 5.537, + "args": { + "External id": 228437,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115435710.182, "dur": 166.506, + "args": { + "External id": 228438,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115435712.011, "dur": 0.418, + "args": { + "External id": 228439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115435713.585, "dur": 22.206, + "args": { + "External id": 228440,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115435737.277, "dur": 6.032, + "args": { + "External id": 228441,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435742.129, "dur": 0.909, + "args": { + "External id": 228442,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115435744.372, "dur": 20.173, + "args": { + "External id": 228443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115435745.760, "dur": 1.492, + "args": { + "External id": 228444,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115435748.563, "dur": 15.697, + "args": { + "External id": 228445,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115435751.188, "dur": 2.311, + "args": { + "External id": 228446,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115435766.279, "dur": 18.980, + "args": { + "External id": 228447,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115435786.826, "dur": 12.471, + "args": { + "External id": 228448,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115435802.147, "dur": 13.424, + "args": { + "External id": 228449,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115435816.923, "dur": 10.986, + "args": { + "External id": 228450,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115435829.696, "dur": 21.399, + "args": { + "External id": 228451,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115435833.889, "dur": 1.739, + "args": { + "External id": 228452,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435838.399, "dur": 0.716, + "args": { + "External id": 228453,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115435853.442, "dur": 10.787, + "args": { + "External id": 228454,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115435865.538, "dur": 10.396, + "args": { + "External id": 228455,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115435883.900, "dur": 2.079, + "args": { + "External id": 228456,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115435894.391, "dur": 3.990, + "args": { + "External id": 228457,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115435897.012, "dur": 0.497, + "args": { + "External id": 228458,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115435958.894, "dur": 43.964, + "args": { + "External id": 228459,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436007.554, "dur": 4.702, + "args": { + "External id": 228460,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436010.414, "dur": 0.844, + "args": { + "External id": 228461,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115436013.714, "dur": 24.406, + "args": { + "External id": 228462,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115436042.479, "dur": 6.786, + "args": { + "External id": 228463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115436044.323, "dur": 4.236, + "args": { + "External id": 228464,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436046.523, "dur": 1.840, + "args": { + "External id": 228465,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115436051.659, "dur": 40.625, + "args": { + "External id": 228466,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115436053.007, "dur": 38.623, + "args": { + "External id": 228467,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115436096.278, "dur": 13.386, + "args": { + "External id": 228468,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115436114.054, "dur": 27.461, + "args": { + "External id": 228469,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115436116.402, "dur": 24.722, + "args": { + "External id": 228470,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436121.768, "dur": 0.916, + "args": { + "External id": 228471,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115436146.874, "dur": 30.920, + "args": { + "External id": 228472,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115436148.947, "dur": 28.576, + "args": { + "External id": 228473,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 7272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436154.114, "dur": 4.231, + "args": { + "External id": 228474,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115436159.786, "dur": 17.172, + "args": { + "External id": 228475,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115436193.596, "dur": 5.454, + "args": { + "External id": 228476,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115436195.839, "dur": 2.907, + "args": { + "External id": 228477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115436200.044, "dur": 1.341, + "args": { + "External id": 228478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115436200.763, "dur": 0.552, + "args": { + "External id": 228479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115436239.069, "dur": 21.490, + "args": { + "External id": 228480,"Sequence number": 2757933, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7279 + } + }, + { + "ph": "s", "id": 23, "pid": 4183442, "tid": 4183442, "ts": 667115436239.069, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436266.083, "dur": 5.646, + "args": { + "External id": 228481,"Sequence number": 2757934, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 7280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436269.282, "dur": 1.088, + "args": { + "External id": 228482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115436274.492, "dur": 6.563, + "args": { + "External id": 228483,"Sequence number": 2757934, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "1"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 7282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436279.062, "dur": 0.853, + "args": { + "External id": 228484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436282.310, "dur": 3.089, + "args": { + "External id": 228485,"Sequence number": 2757934, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 7284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436283.835, "dur": 0.942, + "args": { + "External id": 228486,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 7285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436289.755, "dur": 6.174, + "args": { + "External id": 228487,"Sequence number": 2757934, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7286 + } + }, + { + "ph": "s", "id": 22, "pid": 4183442, "tid": 4183442, "ts": 667115436289.755, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436293.394, "dur": 1.031, + "args": { + "External id": 228488,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436296.999, "dur": 5.662, + "args": { + "External id": 228489,"Sequence number": 2757935, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7288 + } + }, + { + "ph": "s", "id": 21, "pid": 4183442, "tid": 4183442, "ts": 667115436296.999, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436300.803, "dur": 1.023, + "args": { + "External id": 228490,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115436303.843, "dur": 5.962, + "args": { + "External id": 228491,"Sequence number": 2757936, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 7290 + } + }, + { + "ph": "s", "id": 20, "pid": 4183442, "tid": 4183442, "ts": 667115436303.843, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436308.227, "dur": 0.754, + "args": { + "External id": 228492,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115436310.995, "dur": 4.546, + "args": { + "External id": 228493,"Sequence number": 2757937, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 7292 + } + }, + { + "ph": "s", "id": 19, "pid": 4183442, "tid": 4183442, "ts": 667115436310.995, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436313.814, "dur": 0.970, + "args": { + "External id": 228494,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 7293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115436319.425, "dur": 30.244, + "args": { + "External id": 228495,"Sequence number": 2757938, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115436321.413, "dur": 27.987, + "args": { + "External id": 228496,"Sequence number": 2757938, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436323.901, "dur": 8.915, + "args": { + "External id": 228497,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 7296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115436326.630, "dur": 5.582, + "args": { + "External id": 228498,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115436333.712, "dur": 15.186, + "args": { + "External id": 228499,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 7298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115436375.129, "dur": 4.188, + "args": { + "External id": 228500,"Sequence number": 2757938, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 7299 + } + }, + { + "ph": "s", "id": 18, "pid": 4183442, "tid": 4183442, "ts": 667115436375.129, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115436381.803, "dur": 1.353, + "args": { + "External id": 228501,"Sequence number": 2757939, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115436413.989, "dur": 22687.077, + "args": { + "External id": 228502,"Sequence number": 2757939, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 7301 + } + }, + { + "ph": "s", "id": 17, "pid": 4183442, "tid": 4183442, "ts": 667115436413.989, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115436427.989, "dur": 25.078, + "args": { + "External id": 228503,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115436428.895, "dur": 23.952, + "args": { + "External id": 228504,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436430.663, "dur": 5.518, + "args": { + "External id": 228505,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115436432.179, "dur": 3.586, + "args": { + "External id": 228506,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115436437.026, "dur": 15.403, + "args": { + "External id": 228507,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 7306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436467.720, "dur": 46.662, + "args": { + "External id": 228508,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436468.878, "dur": 6.655, + "args": { + "External id": 228509,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436471.278, "dur": 3.927, + "args": { + "External id": 228510,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115436476.809, "dur": 37.339, + "args": { + "External id": 228511,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115436479.062, "dur": 34.382, + "args": { + "External id": 228512,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436519.387, "dur": 25.222, + "args": { + "External id": 228513,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115436520.249, "dur": 6.641, + "args": { + "External id": 228514,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436522.764, "dur": 3.826, + "args": { + "External id": 228515,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115436527.784, "dur": 16.618, + "args": { + "External id": 228516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115436528.757, "dur": 15.126, + "args": { + "External id": 228517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 7316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115436551.363, "dur": 16.877, + "args": { + "External id": 228518,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 7317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115436552.909, "dur": 2.800, + "args": { + "External id": 228519,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115436556.257, "dur": 11.720, + "args": { + "External id": 228520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 7319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115436557.262, "dur": 10.304, + "args": { + "External id": 228521,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 4183442, + "ts": 667115436574.147, "dur": 21.610, + "args": { + "External id": 228522,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115436598.877, "dur": 48.794, + "args": { + "External id": 228523,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115436600.835, "dur": 46.476, + "args": { + "External id": 228524,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436605.904, "dur": 0.886, + "args": { + "External id": 228525,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115436608.337, "dur": 24.183, + "args": { + "External id": 228526,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115436612.280, "dur": 19.997, + "args": { + "External id": 228527,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 7326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115436614.807, "dur": 2.570, + "args": { + "External id": 228528,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115436618.543, "dur": 13.385, + "args": { + "External id": 228529,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 7328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115436686.650, "dur": 16779.270, + "args": { + "External id": 228530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115436688.324, "dur": 16776.772, + "args": { + "External id": 228531,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115453476.253, "dur": 6.360, + "args": { + "External id": 228532,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115453480.148, "dur": 0.879, + "args": { + "External id": 228533,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115453487.895, "dur": 118.777, + "args": { + "External id": 228534,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115453489.393, "dur": 17.987, + "args": { + "External id": 228535,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115453501.900, "dur": 4.340, + "args": { + "External id": 228536,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115453504.296, "dur": 1.516, + "args": { + "External id": 228537,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115453509.112, "dur": 96.949, + "args": { + "External id": 228538,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115453511.033, "dur": 93.960, + "args": { + "External id": 228539,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115453610.991, "dur": 4.297, + "args": { + "External id": 228540,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115453613.187, "dur": 0.735, + "args": { + "External id": 228541,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115453622.449, "dur": 2.750, + "args": { + "External id": 228542,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115453634.327, "dur": 7.875, + "args": { + "External id": 228543,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115453637.417, "dur": 4.506, + "args": { + "External id": 228544,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115453800.322, "dur": 230.155, + "args": { + "External id": 228545,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115453803.889, "dur": 5.416, + "args": { + "External id": 228546,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115453811.545, "dur": 218.382, + "args": { + "External id": 228547,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115453813.502, "dur": 0.444, + "args": { + "External id": 228548,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115453815.755, "dur": 26.815, + "args": { + "External id": 228549,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115453844.453, "dur": 6.390, + "args": { + "External id": 228550,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115453849.310, "dur": 1.188, + "args": { + "External id": 228551,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115453852.610, "dur": 39.031, + "args": { + "External id": 228552,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115453867.840, "dur": 1.763, + "args": { + "External id": 228553,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115453871.261, "dur": 20.080, + "args": { + "External id": 228554,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115453875.070, "dur": 2.994, + "args": { + "External id": 228555,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115453893.595, "dur": 22.556, + "args": { + "External id": 228556,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115453918.406, "dur": 16.611, + "args": { + "External id": 228557,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115453938.117, "dur": 15.206, + "args": { + "External id": 228558,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115453955.182, "dur": 18.766, + "args": { + "External id": 228559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115453975.858, "dur": 24.853, + "args": { + "External id": 228560,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115453980.461, "dur": 1.675, + "args": { + "External id": 228561,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115453984.723, "dur": 1.121, + "args": { + "External id": 228562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115454002.364, "dur": 12.620, + "args": { + "External id": 228563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115454016.712, "dur": 12.302, + "args": { + "External id": 228564,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115454037.882, "dur": 2.525, + "args": { + "External id": 228565,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454046.912, "dur": 4.103, + "args": { + "External id": 228566,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454049.557, "dur": 0.615, + "args": { + "External id": 228567,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115454126.100, "dur": 57.315, + "args": { + "External id": 228568,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454188.735, "dur": 6.667, + "args": { + "External id": 228569,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454191.633, "dur": 0.956, + "args": { + "External id": 228570,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115454197.433, "dur": 26.549, + "args": { + "External id": 228571,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115454229.315, "dur": 6.603, + "args": { + "External id": 228572,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115454231.422, "dur": 3.677, + "args": { + "External id": 228573,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454233.368, "dur": 1.476, + "args": { + "External id": 228574,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115454239.071, "dur": 46.848, + "args": { + "External id": 228575,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115454240.611, "dur": 44.692, + "args": { + "External id": 228576,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115454290.487, "dur": 15.066, + "args": { + "External id": 228577,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454311.720, "dur": 4.691, + "args": { + "External id": 228578,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454314.301, "dur": 1.087, + "args": { + "External id": 228579,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115454320.753, "dur": 51.779, + "args": { + "External id": 228580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115454322.312, "dur": 4.443, + "args": { + "External id": 228581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115454323.186, "dur": 2.931, + "args": { + "External id": 228582,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454325.104, "dur": 0.862, + "args": { + "External id": 228583,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115454327.477, "dur": 44.735, + "args": { + "External id": 228584,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115454328.486, "dur": 43.101, + "args": { + "External id": 228585,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454376.414, "dur": 3.956, + "args": { + "External id": 228586,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454378.441, "dur": 0.724, + "args": { + "External id": 228587,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115454385.877, "dur": 1.538, + "args": { + "External id": 228588,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115454395.078, "dur": 6.714, + "args": { + "External id": 228589,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115454397.603, "dur": 3.884, + "args": { + "External id": 228590,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115454487.537, "dur": 312.701, + "args": { + "External id": 228591,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115454509.853, "dur": 3.326, + "args": { + "External id": 228592,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115454515.192, "dur": 284.417, + "args": { + "External id": 228593,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115454516.675, "dur": 0.300, + "args": { + "External id": 228594,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115454518.216, "dur": 23.722, + "args": { + "External id": 228595,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115454543.446, "dur": 6.233, + "args": { + "External id": 228596,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454548.340, "dur": 1.069, + "args": { + "External id": 228597,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115454550.548, "dur": 21.421, + "args": { + "External id": 228598,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115454551.804, "dur": 1.533, + "args": { + "External id": 228599,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115454554.877, "dur": 16.704, + "args": { + "External id": 228600,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115454557.564, "dur": 2.791, + "args": { + "External id": 228601,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115454573.769, "dur": 20.222, + "args": { + "External id": 228602,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115454595.635, "dur": 14.478, + "args": { + "External id": 228603,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115454612.855, "dur": 14.417, + "args": { + "External id": 228604,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115454629.272, "dur": 13.263, + "args": { + "External id": 228605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115454644.425, "dur": 67.164, + "args": { + "External id": 228606,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115454646.381, "dur": 1.867, + "args": { + "External id": 228607,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454650.949, "dur": 33.849, + "args": { + "External id": 228608,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115454714.169, "dur": 39.573, + "args": { + "External id": 228609,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115454754.923, "dur": 43.773, + "args": { + "External id": 228610,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115454808.781, "dur": 2.524, + "args": { + "External id": 228611,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454821.245, "dur": 3.901, + "args": { + "External id": 228612,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454823.771, "dur": 0.490, + "args": { + "External id": 228613,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115454899.081, "dur": 49.679, + "args": { + "External id": 228614,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115454953.528, "dur": 5.117, + "args": { + "External id": 228615,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454956.286, "dur": 1.116, + "args": { + "External id": 228616,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115454960.517, "dur": 24.685, + "args": { + "External id": 228617,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115454990.335, "dur": 6.484, + "args": { + "External id": 228618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115454992.244, "dur": 3.771, + "args": { + "External id": 228619,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115454994.332, "dur": 1.469, + "args": { + "External id": 228620,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115454999.899, "dur": 44.855, + "args": { + "External id": 228621,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115455000.998, "dur": 43.113, + "args": { + "External id": 228622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115455048.750, "dur": 14.537, + "args": { + "External id": 228623,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455068.897, "dur": 4.146, + "args": { + "External id": 228624,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455071.353, "dur": 0.795, + "args": { + "External id": 228625,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115455077.446, "dur": 63.457, + "args": { + "External id": 228626,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115455078.871, "dur": 4.508, + "args": { + "External id": 228627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115455079.683, "dur": 3.185, + "args": { + "External id": 228628,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455081.793, "dur": 0.918, + "args": { + "External id": 228629,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115455096.174, "dur": 44.408, + "args": { + "External id": 228630,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115455099.145, "dur": 40.870, + "args": { + "External id": 228631,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455144.972, "dur": 4.197, + "args": { + "External id": 228632,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455147.122, "dur": 0.867, + "args": { + "External id": 228633,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115455154.787, "dur": 1.755, + "args": { + "External id": 228634,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455163.876, "dur": 7.939, + "args": { + "External id": 228635,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455166.395, "dur": 5.119, + "args": { + "External id": 228636,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115455255.188, "dur": 170.650, + "args": { + "External id": 228637,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455257.303, "dur": 1.893, + "args": { + "External id": 228638,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115455260.986, "dur": 164.382, + "args": { + "External id": 228639,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115455262.533, "dur": 0.338, + "args": { + "External id": 228640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115455264.113, "dur": 21.890, + "args": { + "External id": 228641,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115455287.709, "dur": 2.975, + "args": { + "External id": 228642,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455289.651, "dur": 0.819, + "args": { + "External id": 228643,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115455292.080, "dur": 23.653, + "args": { + "External id": 228644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455293.293, "dur": 1.802, + "args": { + "External id": 228645,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115455296.133, "dur": 19.282, + "args": { + "External id": 228646,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115455301.349, "dur": 2.333, + "args": { + "External id": 228647,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115455317.755, "dur": 18.399, + "args": { + "External id": 228648,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115455337.756, "dur": 13.137, + "args": { + "External id": 228649,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115455353.679, "dur": 12.955, + "args": { + "External id": 228650,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115455367.850, "dur": 11.376, + "args": { + "External id": 228651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115455380.979, "dur": 18.979, + "args": { + "External id": 228652,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115455383.028, "dur": 1.592, + "args": { + "External id": 228653,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455387.033, "dur": 0.837, + "args": { + "External id": 228654,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115455401.884, "dur": 10.822, + "args": { + "External id": 228655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115455413.766, "dur": 10.224, + "args": { + "External id": 228656,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115455434.706, "dur": 1.489, + "args": { + "External id": 228657,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455444.516, "dur": 3.217, + "args": { + "External id": 228658,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455446.612, "dur": 0.406, + "args": { + "External id": 228659,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115455530.412, "dur": 44.431, + "args": { + "External id": 228660,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455580.367, "dur": 8.122, + "args": { + "External id": 228661,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455583.860, "dur": 3.133, + "args": { + "External id": 228662,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115455589.827, "dur": 27.955, + "args": { + "External id": 228663,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115455622.962, "dur": 5.606, + "args": { + "External id": 228664,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115455624.467, "dur": 3.242, + "args": { + "External id": 228665,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455626.435, "dur": 0.956, + "args": { + "External id": 228666,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115455630.960, "dur": 78.361, + "args": { + "External id": 228667,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115455632.116, "dur": 75.742, + "args": { + "External id": 228668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115455714.803, "dur": 15.320, + "args": { + "External id": 228669,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455737.213, "dur": 5.097, + "args": { + "External id": 228670,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455740.079, "dur": 1.054, + "args": { + "External id": 228671,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115455746.522, "dur": 52.423, + "args": { + "External id": 228672,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115455747.455, "dur": 5.173, + "args": { + "External id": 228673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115455748.756, "dur": 3.306, + "args": { + "External id": 228674,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455750.753, "dur": 1.146, + "args": { + "External id": 228675,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115455753.641, "dur": 44.924, + "args": { + "External id": 228676,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115455754.536, "dur": 43.400, + "args": { + "External id": 228677,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115455803.167, "dur": 4.093, + "args": { + "External id": 228678,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455805.164, "dur": 0.840, + "args": { + "External id": 228679,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115455813.810, "dur": 1.606, + "args": { + "External id": 228680,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455823.444, "dur": 6.625, + "args": { + "External id": 228681,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455825.445, "dur": 4.378, + "args": { + "External id": 228682,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115455915.071, "dur": 188.631, + "args": { + "External id": 228683,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455917.041, "dur": 4.171, + "args": { + "External id": 228684,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115455923.177, "dur": 179.989, + "args": { + "External id": 228685,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115455924.649, "dur": 0.388, + "args": { + "External id": 228686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115455926.425, "dur": 21.467, + "args": { + "External id": 228687,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115455949.363, "dur": 6.053, + "args": { + "External id": 228688,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115455954.022, "dur": 1.153, + "args": { + "External id": 228689,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115455956.485, "dur": 21.234, + "args": { + "External id": 228690,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115455957.505, "dur": 1.814, + "args": { + "External id": 228691,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115455960.865, "dur": 16.544, + "args": { + "External id": 228692,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115455963.181, "dur": 2.454, + "args": { + "External id": 228693,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115455979.355, "dur": 21.375, + "args": { + "External id": 228694,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115456002.505, "dur": 13.102, + "args": { + "External id": 228695,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115456018.589, "dur": 16.495, + "args": { + "External id": 228696,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115456036.513, "dur": 13.138, + "args": { + "External id": 228697,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115456051.389, "dur": 23.031, + "args": { + "External id": 228698,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115456053.191, "dur": 1.625, + "args": { + "External id": 228699,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456057.035, "dur": 2.915, + "args": { + "External id": 228700,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115456076.224, "dur": 12.820, + "args": { + "External id": 228701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115456090.269, "dur": 11.579, + "args": { + "External id": 228702,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115456109.767, "dur": 1.717, + "args": { + "External id": 228703,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456119.478, "dur": 3.572, + "args": { + "External id": 228704,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456121.704, "dur": 0.419, + "args": { + "External id": 228705,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115456183.164, "dur": 39.995, + "args": { + "External id": 228706,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456227.457, "dur": 5.136, + "args": { + "External id": 228707,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456230.386, "dur": 1.257, + "args": { + "External id": 228708,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115456234.219, "dur": 21.811, + "args": { + "External id": 228709,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115456260.183, "dur": 5.728, + "args": { + "External id": 228710,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115456261.691, "dur": 3.527, + "args": { + "External id": 228711,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456263.783, "dur": 1.215, + "args": { + "External id": 228712,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115456267.901, "dur": 42.175, + "args": { + "External id": 228713,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115456269.163, "dur": 40.200, + "args": { + "External id": 228714,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115456313.718, "dur": 15.134, + "args": { + "External id": 228715,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456334.403, "dur": 4.179, + "args": { + "External id": 228716,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456337.063, "dur": 0.665, + "args": { + "External id": 228717,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115456342.402, "dur": 48.967, + "args": { + "External id": 228718,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115456343.255, "dur": 3.863, + "args": { + "External id": 228719,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115456344.160, "dur": 2.408, + "args": { + "External id": 228720,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456345.687, "dur": 0.745, + "args": { + "External id": 228721,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115456348.295, "dur": 42.684, + "args": { + "External id": 228722,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115456348.714, "dur": 41.651, + "args": { + "External id": 228723,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456395.625, "dur": 3.728, + "args": { + "External id": 228724,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456397.778, "dur": 0.552, + "args": { + "External id": 228725,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115456404.878, "dur": 1.444, + "args": { + "External id": 228726,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115456413.551, "dur": 5.804, + "args": { + "External id": 228727,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115456415.531, "dur": 3.528, + "args": { + "External id": 228728,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115456515.766, "dur": 230.354, + "args": { + "External id": 228729,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115456520.459, "dur": 3.491, + "args": { + "External id": 228730,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115456525.985, "dur": 219.499, + "args": { + "External id": 228731,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115456527.504, "dur": 0.508, + "args": { + "External id": 228732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115456529.227, "dur": 26.218, + "args": { + "External id": 228733,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115456557.158, "dur": 6.497, + "args": { + "External id": 228734,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456561.808, "dur": 1.624, + "args": { + "External id": 228735,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115456564.659, "dur": 22.232, + "args": { + "External id": 228736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115456566.002, "dur": 1.779, + "args": { + "External id": 228737,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115456569.299, "dur": 17.257, + "args": { + "External id": 228738,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115456571.624, "dur": 2.395, + "args": { + "External id": 228739,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115456588.436, "dur": 19.800, + "args": { + "External id": 228740,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115456609.814, "dur": 17.310, + "args": { + "External id": 228741,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115456629.594, "dur": 14.080, + "args": { + "External id": 228742,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115456645.152, "dur": 47.208, + "args": { + "External id": 228743,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115456695.505, "dur": 23.589, + "args": { + "External id": 228744,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115456697.438, "dur": 1.903, + "args": { + "External id": 228745,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456701.918, "dur": 0.968, + "args": { + "External id": 228746,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115456721.027, "dur": 11.727, + "args": { + "External id": 228747,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115456734.287, "dur": 9.851, + "args": { + "External id": 228748,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115456753.822, "dur": 2.365, + "args": { + "External id": 228749,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456766.221, "dur": 4.007, + "args": { + "External id": 228750,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456768.693, "dur": 0.668, + "args": { + "External id": 228751,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115456840.386, "dur": 50.089, + "args": { + "External id": 228752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115456895.375, "dur": 5.179, + "args": { + "External id": 228753,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456898.414, "dur": 1.140, + "args": { + "External id": 228754,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115456902.435, "dur": 23.369, + "args": { + "External id": 228755,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115456930.442, "dur": 6.593, + "args": { + "External id": 228756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115456932.587, "dur": 3.707, + "args": { + "External id": 228757,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115456934.873, "dur": 1.205, + "args": { + "External id": 228758,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115456939.763, "dur": 43.968, + "args": { + "External id": 228759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115456941.000, "dur": 41.940, + "args": { + "External id": 228760,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115456987.478, "dur": 13.341, + "args": { + "External id": 228761,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457006.370, "dur": 4.244, + "args": { + "External id": 228762,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457009.010, "dur": 0.720, + "args": { + "External id": 228763,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115457014.467, "dur": 48.081, + "args": { + "External id": 228764,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115457015.304, "dur": 4.185, + "args": { + "External id": 228765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115457016.144, "dur": 2.720, + "args": { + "External id": 228766,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457017.927, "dur": 0.782, + "args": { + "External id": 228767,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115457020.101, "dur": 42.046, + "args": { + "External id": 228768,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115457021.257, "dur": 40.227, + "args": { + "External id": 228769,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457066.611, "dur": 3.747, + "args": { + "External id": 228770,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457068.388, "dur": 0.763, + "args": { + "External id": 228771,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115457076.424, "dur": 1.496, + "args": { + "External id": 228772,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457085.333, "dur": 8.200, + "args": { + "External id": 228773,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457087.587, "dur": 5.683, + "args": { + "External id": 228774,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115457177.199, "dur": 184.454, + "args": { + "External id": 228775,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457179.110, "dur": 2.154, + "args": { + "External id": 228776,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115457182.736, "dur": 178.447, + "args": { + "External id": 228777,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115457184.129, "dur": 0.392, + "args": { + "External id": 228778,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115457185.842, "dur": 22.175, + "args": { + "External id": 228779,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115457209.886, "dur": 3.037, + "args": { + "External id": 228780,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457211.755, "dur": 0.954, + "args": { + "External id": 228781,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115457214.052, "dur": 24.012, + "args": { + "External id": 228782,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457215.564, "dur": 1.686, + "args": { + "External id": 228783,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115457218.295, "dur": 19.415, + "args": { + "External id": 228784,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115457222.949, "dur": 2.217, + "args": { + "External id": 228785,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115457239.759, "dur": 22.780, + "args": { + "External id": 228786,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115457264.182, "dur": 13.098, + "args": { + "External id": 228787,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115457280.029, "dur": 15.521, + "args": { + "External id": 228788,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115457297.072, "dur": 12.664, + "args": { + "External id": 228789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115457311.300, "dur": 21.133, + "args": { + "External id": 228790,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115457313.315, "dur": 1.832, + "args": { + "External id": 228791,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457317.732, "dur": 0.596, + "args": { + "External id": 228792,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115457334.375, "dur": 12.399, + "args": { + "External id": 228793,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115457347.783, "dur": 12.072, + "args": { + "External id": 228794,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115457367.069, "dur": 1.498, + "args": { + "External id": 228795,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457376.560, "dur": 3.054, + "args": { + "External id": 228796,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457378.419, "dur": 0.394, + "args": { + "External id": 228797,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115457448.956, "dur": 61.041, + "args": { + "External id": 228798,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457516.609, "dur": 8.406, + "args": { + "External id": 228799,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457520.306, "dur": 3.127, + "args": { + "External id": 228800,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115457526.364, "dur": 26.990, + "args": { + "External id": 228801,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115457558.412, "dur": 5.746, + "args": { + "External id": 228802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115457560.082, "dur": 3.373, + "args": { + "External id": 228803,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457562.256, "dur": 1.002, + "args": { + "External id": 228804,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115457566.969, "dur": 78.968, + "args": { + "External id": 228805,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115457568.482, "dur": 76.925, + "args": { + "External id": 228806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115457649.533, "dur": 52.852, + "args": { + "External id": 228807,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457710.815, "dur": 5.236, + "args": { + "External id": 228808,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457713.900, "dur": 0.993, + "args": { + "External id": 228809,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115457720.664, "dur": 57.410, + "args": { + "External id": 228810,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115457721.642, "dur": 4.414, + "args": { + "External id": 228811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115457722.665, "dur": 2.847, + "args": { + "External id": 228812,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457724.432, "dur": 0.911, + "args": { + "External id": 228813,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115457727.241, "dur": 50.367, + "args": { + "External id": 228814,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115457728.032, "dur": 49.092, + "args": { + "External id": 228815,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115457781.909, "dur": 3.818, + "args": { + "External id": 228816,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457783.892, "dur": 0.694, + "args": { + "External id": 228817,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115457792.026, "dur": 1.694, + "args": { + "External id": 228818,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457801.398, "dur": 15.184, + "args": { + "External id": 228819,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457808.762, "dur": 7.543, + "args": { + "External id": 228820,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115457902.646, "dur": 182.121, + "args": { + "External id": 228821,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457904.680, "dur": 1.839, + "args": { + "External id": 228822,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115457908.035, "dur": 176.265, + "args": { + "External id": 228823,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115457909.790, "dur": 0.345, + "args": { + "External id": 228824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115457911.672, "dur": 24.938, + "args": { + "External id": 228825,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115457938.212, "dur": 3.134, + "args": { + "External id": 228826,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115457940.338, "dur": 0.813, + "args": { + "External id": 228827,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115457942.164, "dur": 23.617, + "args": { + "External id": 228828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115457943.563, "dur": 1.487, + "args": { + "External id": 228829,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115457946.448, "dur": 18.997, + "args": { + "External id": 228830,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115457951.306, "dur": 2.353, + "args": { + "External id": 228831,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115457967.420, "dur": 19.843, + "args": { + "External id": 228832,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115457988.673, "dur": 13.685, + "args": { + "External id": 228833,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115458004.891, "dur": 14.197, + "args": { + "External id": 228834,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115458020.875, "dur": 12.966, + "args": { + "External id": 228835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115458035.915, "dur": 20.358, + "args": { + "External id": 228836,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115458037.783, "dur": 1.765, + "args": { + "External id": 228837,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458041.810, "dur": 0.885, + "args": { + "External id": 228838,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115458057.902, "dur": 13.252, + "args": { + "External id": 228839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115458072.183, "dur": 10.767, + "args": { + "External id": 228840,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115458090.533, "dur": 1.662, + "args": { + "External id": 228841,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458100.737, "dur": 3.413, + "args": { + "External id": 228842,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458102.787, "dur": 0.587, + "args": { + "External id": 228843,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115458166.391, "dur": 39.805, + "args": { + "External id": 228844,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458210.639, "dur": 5.065, + "args": { + "External id": 228845,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458213.569, "dur": 1.097, + "args": { + "External id": 228846,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115458217.074, "dur": 21.839, + "args": { + "External id": 228847,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115458243.537, "dur": 5.462, + "args": { + "External id": 228848,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115458244.928, "dur": 3.387, + "args": { + "External id": 228849,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458246.924, "dur": 1.186, + "args": { + "External id": 228850,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115458251.226, "dur": 41.216, + "args": { + "External id": 228851,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115458252.213, "dur": 39.510, + "args": { + "External id": 228852,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115458295.986, "dur": 15.297, + "args": { + "External id": 228853,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458316.641, "dur": 3.955, + "args": { + "External id": 228854,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458318.786, "dur": 0.946, + "args": { + "External id": 228855,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115458324.071, "dur": 47.496, + "args": { + "External id": 228856,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115458324.972, "dur": 4.195, + "args": { + "External id": 228857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115458325.828, "dur": 2.791, + "args": { + "External id": 228858,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458327.783, "dur": 0.696, + "args": { + "External id": 228859,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115458330.253, "dur": 40.977, + "args": { + "External id": 228860,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115458330.945, "dur": 39.743, + "args": { + "External id": 228861,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458375.335, "dur": 5.531, + "args": { + "External id": 228862,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458377.123, "dur": 2.666, + "args": { + "External id": 228863,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115458385.818, "dur": 1.395, + "args": { + "External id": 228864,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115458419.823, "dur": 7.172, + "args": { + "External id": 228865,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115458422.599, "dur": 4.126, + "args": { + "External id": 228866,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115458524.209, "dur": 221.967, + "args": { + "External id": 228867,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115458526.520, "dur": 2.832, + "args": { + "External id": 228868,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115458533.693, "dur": 212.039, + "args": { + "External id": 228869,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115458535.221, "dur": 0.318, + "args": { + "External id": 228870,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115458536.625, "dur": 22.633, + "args": { + "External id": 228871,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115458560.698, "dur": 6.109, + "args": { + "External id": 228872,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458562.931, "dur": 3.505, + "args": { + "External id": 228873,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115458567.586, "dur": 21.873, + "args": { + "External id": 228874,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115458568.836, "dur": 1.907, + "args": { + "External id": 228875,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115458572.117, "dur": 17.072, + "args": { + "External id": 228876,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115458574.598, "dur": 2.265, + "args": { + "External id": 228877,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115458591.097, "dur": 20.150, + "args": { + "External id": 228878,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115458612.909, "dur": 13.015, + "args": { + "External id": 228879,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115458628.839, "dur": 14.565, + "args": { + "External id": 228880,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115458644.901, "dur": 46.140, + "args": { + "External id": 228881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115458694.068, "dur": 23.081, + "args": { + "External id": 228882,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115458696.428, "dur": 1.911, + "args": { + "External id": 228883,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458700.646, "dur": 0.651, + "args": { + "External id": 228884,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115458718.689, "dur": 12.763, + "args": { + "External id": 228885,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115458732.848, "dur": 11.786, + "args": { + "External id": 228886,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115458753.077, "dur": 2.459, + "args": { + "External id": 228887,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458765.734, "dur": 3.633, + "args": { + "External id": 228888,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458768.189, "dur": 0.408, + "args": { + "External id": 228889,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115458833.887, "dur": 48.933, + "args": { + "External id": 228890,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115458887.523, "dur": 6.691, + "args": { + "External id": 228891,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458890.312, "dur": 2.644, + "args": { + "External id": 228892,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115458895.920, "dur": 23.602, + "args": { + "External id": 228893,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115458924.385, "dur": 6.113, + "args": { + "External id": 228894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115458926.540, "dur": 3.228, + "args": { + "External id": 228895,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115458928.855, "dur": 0.723, + "args": { + "External id": 228896,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115458933.392, "dur": 41.940, + "args": { + "External id": 228897,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115458934.585, "dur": 40.184, + "args": { + "External id": 228898,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115458978.998, "dur": 15.127, + "args": { + "External id": 228899,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115458998.837, "dur": 24.352, + "args": { + "External id": 228900,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115459001.220, "dur": 21.575, + "args": { + "External id": 228901,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459006.065, "dur": 1.079, + "args": { + "External id": 228902,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115459028.200, "dur": 29.802, + "args": { + "External id": 228903,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115459033.713, "dur": 24.083, + "args": { + "External id": 228904,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 7703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459038.817, "dur": 3.896, + "args": { + "External id": 228905,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115459043.825, "dur": 13.512, + "args": { + "External id": 228906,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115459070.696, "dur": 5.060, + "args": { + "External id": 228907,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115459072.839, "dur": 2.626, + "args": { + "External id": 228908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115459076.931, "dur": 1.538, + "args": { + "External id": 228909,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115459077.797, "dur": 0.600, + "args": { + "External id": 228910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115459116.849, "dur": 23.107, + "args": { + "External id": 228911,"Sequence number": 2757940, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115459142.258, "dur": 14.729, + "args": { + "External id": 228912,"Sequence number": 2757941, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7711 + } + }, + { + "ph": "s", "id": 16, "pid": 4183442, "tid": 4183442, "ts": 667115459142.258, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115459162.414, "dur": 5.666, + "args": { + "External id": 228913,"Sequence number": 2757942, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 7712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459165.698, "dur": 1.014, + "args": { + "External id": 228914,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115459170.471, "dur": 7.776, + "args": { + "External id": 228915,"Sequence number": 2757942, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 7714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459175.837, "dur": 1.129, + "args": { + "External id": 228916,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115459179.416, "dur": 3.434, + "args": { + "External id": 228917,"Sequence number": 2757942, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 7716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459181.465, "dur": 0.775, + "args": { + "External id": 228918,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 7717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115459187.253, "dur": 5.846, + "args": { + "External id": 228919,"Sequence number": 2757942, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7718 + } + }, + { + "ph": "s", "id": 15, "pid": 4183442, "tid": 4183442, "ts": 667115459187.253, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459190.888, "dur": 0.826, + "args": { + "External id": 228920,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115459194.196, "dur": 5.206, + "args": { + "External id": 228921,"Sequence number": 2757943, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7720 + } + }, + { + "ph": "s", "id": 14, "pid": 4183442, "tid": 4183442, "ts": 667115459194.196, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459197.797, "dur": 0.797, + "args": { + "External id": 228922,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115459200.433, "dur": 5.228, + "args": { + "External id": 228923,"Sequence number": 2757944, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 7722 + } + }, + { + "ph": "s", "id": 13, "pid": 4183442, "tid": 4183442, "ts": 667115459200.433, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459203.869, "dur": 0.934, + "args": { + "External id": 228924,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115459206.679, "dur": 5.174, + "args": { + "External id": 228925,"Sequence number": 2757945, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 7724 + } + }, + { + "ph": "s", "id": 12, "pid": 4183442, "tid": 4183442, "ts": 667115459206.679, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459209.520, "dur": 1.568, + "args": { + "External id": 228926,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 7725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115459215.648, "dur": 32.765, + "args": { + "External id": 228927,"Sequence number": 2757946, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115459217.145, "dur": 31.072, + "args": { + "External id": 228928,"Sequence number": 2757946, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459219.868, "dur": 6.717, + "args": { + "External id": 228929,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 7728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115459222.514, "dur": 3.512, + "args": { + "External id": 228930,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115459227.470, "dur": 20.222, + "args": { + "External id": 228931,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 7730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115459273.770, "dur": 3.891, + "args": { + "External id": 228932,"Sequence number": 2757946, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 7731 + } + }, + { + "ph": "s", "id": 11, "pid": 4183442, "tid": 4183442, "ts": 667115459273.770, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115459280.036, "dur": 3.556, + "args": { + "External id": 228933,"Sequence number": 2757947, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115459315.616, "dur": 23079.796, + "args": { + "External id": 228934,"Sequence number": 2757947, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 7733 + } + }, + { + "ph": "s", "id": 10, "pid": 4183442, "tid": 4183442, "ts": 667115459315.616, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115459330.223, "dur": 28.093, + "args": { + "External id": 228935,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115459331.016, "dur": 27.108, + "args": { + "External id": 228936,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459332.373, "dur": 5.311, + "args": { + "External id": 228937,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115459333.456, "dur": 3.790, + "args": { + "External id": 228938,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115459338.318, "dur": 19.364, + "args": { + "External id": 228939,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 7738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459373.008, "dur": 27.040, + "args": { + "External id": 228940,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459374.198, "dur": 6.116, + "args": { + "External id": 228941,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459376.234, "dur": 3.675, + "args": { + "External id": 228942,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115459381.557, "dur": 18.278, + "args": { + "External id": 228943,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115459383.582, "dur": 15.762, + "args": { + "External id": 228944,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459403.372, "dur": 21.056, + "args": { + "External id": 228945,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115459404.217, "dur": 4.962, + "args": { + "External id": 228946,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459405.764, "dur": 3.111, + "args": { + "External id": 228947,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115459410.006, "dur": 14.231, + "args": { + "External id": 228948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115459411.137, "dur": 12.800, + "args": { + "External id": 228949,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 7748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115459430.505, "dur": 19.626, + "args": { + "External id": 228950,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 7749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115459432.588, "dur": 5.048, + "args": { + "External id": 228951,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115459438.284, "dur": 11.601, + "args": { + "External id": 228952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 7751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115459439.011, "dur": 10.542, + "args": { + "External id": 228953,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 4183442, + "ts": 667115459454.912, "dur": 22.575, + "args": { + "External id": 228954,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115459479.914, "dur": 76.562, + "args": { + "External id": 228955,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115459481.661, "dur": 74.289, + "args": { + "External id": 228956,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459486.470, "dur": 1.425, + "args": { + "External id": 228957,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115459489.228, "dur": 49.153, + "args": { + "External id": 228958,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115459510.570, "dur": 27.550, + "args": { + "External id": 228959,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 7758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115459515.315, "dur": 4.130, + "args": { + "External id": 228960,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115459520.444, "dur": 17.377, + "args": { + "External id": 228961,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 7760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115459560.843, "dur": 17312.380, + "args": { + "External id": 228962,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115459562.649, "dur": 17309.112, + "args": { + "External id": 228963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115476885.373, "dur": 6.923, + "args": { + "External id": 228964,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115476889.543, "dur": 1.008, + "args": { + "External id": 228965,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115476898.052, "dur": 105.946, + "args": { + "External id": 228966,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115476899.664, "dur": 6.564, + "args": { + "External id": 228967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115476901.782, "dur": 3.495, + "args": { + "External id": 228968,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115476904.044, "dur": 0.943, + "args": { + "External id": 228969,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115476907.604, "dur": 95.813, + "args": { + "External id": 228970,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115476909.815, "dur": 92.445, + "args": { + "External id": 228971,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115477007.796, "dur": 4.306, + "args": { + "External id": 228972,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477010.178, "dur": 0.670, + "args": { + "External id": 228973,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115477019.907, "dur": 2.875, + "args": { + "External id": 228974,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477031.698, "dur": 7.837, + "args": { + "External id": 228975,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477034.477, "dur": 4.776, + "args": { + "External id": 228976,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115477169.558, "dur": 196.462, + "args": { + "External id": 228977,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477173.117, "dur": 2.371, + "args": { + "External id": 228978,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115477177.061, "dur": 188.317, + "args": { + "External id": 228979,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115477181.631, "dur": 0.460, + "args": { + "External id": 228980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115477183.662, "dur": 26.121, + "args": { + "External id": 228981,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115477211.967, "dur": 3.408, + "args": { + "External id": 228982,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477214.086, "dur": 0.977, + "args": { + "External id": 228983,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115477216.608, "dur": 27.844, + "args": { + "External id": 228984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477220.569, "dur": 1.318, + "args": { + "External id": 228985,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115477223.279, "dur": 20.883, + "args": { + "External id": 228986,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115477227.116, "dur": 3.053, + "args": { + "External id": 228987,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115477246.213, "dur": 22.437, + "args": { + "External id": 228988,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115477270.684, "dur": 14.579, + "args": { + "External id": 228989,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115477288.248, "dur": 14.612, + "args": { + "External id": 228990,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115477304.312, "dur": 12.286, + "args": { + "External id": 228991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115477318.531, "dur": 20.049, + "args": { + "External id": 228992,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115477320.615, "dur": 1.701, + "args": { + "External id": 228993,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477324.888, "dur": 0.889, + "args": { + "External id": 228994,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115477340.231, "dur": 11.662, + "args": { + "External id": 228995,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115477353.610, "dur": 10.681, + "args": { + "External id": 228996,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115477373.029, "dur": 1.984, + "args": { + "External id": 228997,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115477381.026, "dur": 4.135, + "args": { + "External id": 228998,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477383.262, "dur": 1.036, + "args": { + "External id": 228999,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115477458.638, "dur": 69.933, + "args": { + "External id": 229000,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115477535.604, "dur": 9.374, + "args": { + "External id": 229001,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477538.882, "dur": 3.132, + "args": { + "External id": 229002,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115477546.946, "dur": 26.380, + "args": { + "External id": 229003,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115477579.801, "dur": 6.758, + "args": { + "External id": 229004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115477581.842, "dur": 3.978, + "args": { + "External id": 229005,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477584.221, "dur": 1.324, + "args": { + "External id": 229006,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115477590.139, "dur": 50.846, + "args": { + "External id": 229007,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115477591.467, "dur": 48.854, + "args": { + "External id": 229008,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115477644.956, "dur": 49.118, + "args": { + "External id": 229009,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115477702.978, "dur": 5.469, + "args": { + "External id": 229010,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477706.539, "dur": 0.813, + "args": { + "External id": 229011,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115477713.556, "dur": 57.397, + "args": { + "External id": 229012,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115477714.662, "dur": 5.046, + "args": { + "External id": 229013,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115477715.890, "dur": 3.143, + "args": { + "External id": 229014,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477717.753, "dur": 1.033, + "args": { + "External id": 229015,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115477720.516, "dur": 50.052, + "args": { + "External id": 229016,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115477721.612, "dur": 48.414, + "args": { + "External id": 229017,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115477775.111, "dur": 3.700, + "args": { + "External id": 229018,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477777.236, "dur": 0.562, + "args": { + "External id": 229019,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115477785.591, "dur": 1.853, + "args": { + "External id": 229020,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477795.179, "dur": 7.867, + "args": { + "External id": 229021,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477798.049, "dur": 4.713, + "args": { + "External id": 229022,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115477904.525, "dur": 276.027, + "args": { + "External id": 229023,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477906.348, "dur": 3.699, + "args": { + "External id": 229024,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115477911.759, "dur": 268.172, + "args": { + "External id": 229025,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115477913.171, "dur": 0.360, + "args": { + "External id": 229026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115477914.697, "dur": 23.054, + "args": { + "External id": 229027,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115477939.581, "dur": 5.849, + "args": { + "External id": 229028,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115477944.350, "dur": 0.860, + "args": { + "External id": 229029,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115477946.677, "dur": 32.048, + "args": { + "External id": 229030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115477947.825, "dur": 1.581, + "args": { + "External id": 229031,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115477960.522, "dur": 17.945, + "args": { + "External id": 229032,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115477963.419, "dur": 2.656, + "args": { + "External id": 229033,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115477980.383, "dur": 21.629, + "args": { + "External id": 229034,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115478003.733, "dur": 15.014, + "args": { + "External id": 229035,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115478021.543, "dur": 15.660, + "args": { + "External id": 229036,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115478038.592, "dur": 14.890, + "args": { + "External id": 229037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115478055.555, "dur": 34.046, + "args": { + "External id": 229038,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115478060.150, "dur": 1.576, + "args": { + "External id": 229039,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478064.475, "dur": 1.073, + "args": { + "External id": 229040,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115478091.258, "dur": 42.987, + "args": { + "External id": 229041,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115478135.509, "dur": 43.456, + "args": { + "External id": 229042,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115478187.158, "dur": 2.066, + "args": { + "External id": 229043,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478198.143, "dur": 3.425, + "args": { + "External id": 229044,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478200.136, "dur": 0.630, + "args": { + "External id": 229045,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115478270.468, "dur": 43.164, + "args": { + "External id": 229046,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478318.470, "dur": 5.238, + "args": { + "External id": 229047,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478321.720, "dur": 0.929, + "args": { + "External id": 229048,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115478325.394, "dur": 23.980, + "args": { + "External id": 229049,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115478354.025, "dur": 6.544, + "args": { + "External id": 229050,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115478355.976, "dur": 3.894, + "args": { + "External id": 229051,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478357.928, "dur": 1.706, + "args": { + "External id": 229052,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115478362.969, "dur": 44.191, + "args": { + "External id": 229053,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115478363.910, "dur": 42.675, + "args": { + "External id": 229054,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115478411.139, "dur": 14.570, + "args": { + "External id": 229055,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478431.742, "dur": 4.156, + "args": { + "External id": 229056,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478434.062, "dur": 1.056, + "args": { + "External id": 229057,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115478439.698, "dur": 47.742, + "args": { + "External id": 229058,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115478440.287, "dur": 4.184, + "args": { + "External id": 229059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115478441.326, "dur": 2.574, + "args": { + "External id": 229060,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478442.719, "dur": 1.030, + "args": { + "External id": 229061,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115478445.047, "dur": 42.074, + "args": { + "External id": 229062,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115478446.260, "dur": 40.127, + "args": { + "External id": 229063,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478508.301, "dur": 5.112, + "args": { + "External id": 229064,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478510.817, "dur": 1.014, + "args": { + "External id": 229065,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115478521.196, "dur": 1.887, + "args": { + "External id": 229066,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115478530.504, "dur": 6.817, + "args": { + "External id": 229067,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115478532.905, "dur": 4.108, + "args": { + "External id": 229068,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115478623.249, "dur": 215.771, + "args": { + "External id": 229069,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115478627.663, "dur": 2.392, + "args": { + "External id": 229070,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115478631.553, "dur": 206.988, + "args": { + "External id": 229071,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115478633.049, "dur": 0.615, + "args": { + "External id": 229072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115478634.967, "dur": 55.329, + "args": { + "External id": 229073,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115478693.178, "dur": 5.640, + "args": { + "External id": 229074,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478697.439, "dur": 1.111, + "args": { + "External id": 229075,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115478699.687, "dur": 23.106, + "args": { + "External id": 229076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115478700.774, "dur": 2.332, + "args": { + "External id": 229077,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115478704.579, "dur": 17.940, + "args": { + "External id": 229078,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115478707.466, "dur": 3.044, + "args": { + "External id": 229079,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115478724.425, "dur": 20.073, + "args": { + "External id": 229080,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115478746.034, "dur": 15.917, + "args": { + "External id": 229081,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115478764.386, "dur": 13.878, + "args": { + "External id": 229082,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115478779.447, "dur": 12.381, + "args": { + "External id": 229083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115478793.803, "dur": 18.959, + "args": { + "External id": 229084,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115478795.936, "dur": 1.737, + "args": { + "External id": 229085,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478799.616, "dur": 0.938, + "args": { + "External id": 229086,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115478814.524, "dur": 11.396, + "args": { + "External id": 229087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115478827.197, "dur": 10.318, + "args": { + "External id": 229088,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115478846.671, "dur": 2.353, + "args": { + "External id": 229089,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478858.034, "dur": 4.127, + "args": { + "External id": 229090,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478860.693, "dur": 0.647, + "args": { + "External id": 229091,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115478929.890, "dur": 47.449, + "args": { + "External id": 229092,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115478982.270, "dur": 4.877, + "args": { + "External id": 229093,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115478985.161, "dur": 0.875, + "args": { + "External id": 229094,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115478988.628, "dur": 29.381, + "args": { + "External id": 229095,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115479022.538, "dur": 6.377, + "args": { + "External id": 229096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115479024.163, "dur": 3.971, + "args": { + "External id": 229097,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479026.179, "dur": 1.766, + "args": { + "External id": 229098,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115479031.162, "dur": 43.318, + "args": { + "External id": 229099,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115479032.330, "dur": 41.316, + "args": { + "External id": 229100,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115479078.073, "dur": 13.448, + "args": { + "External id": 229101,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479097.651, "dur": 4.381, + "args": { + "External id": 229102,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479100.132, "dur": 1.022, + "args": { + "External id": 229103,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115479105.949, "dur": 47.615, + "args": { + "External id": 229104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115479107.446, "dur": 4.507, + "args": { + "External id": 229105,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115479108.176, "dur": 3.223, + "args": { + "External id": 229106,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479110.368, "dur": 0.904, + "args": { + "External id": 229107,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115479112.609, "dur": 40.628, + "args": { + "External id": 229108,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115479113.330, "dur": 39.259, + "args": { + "External id": 229109,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479157.504, "dur": 3.477, + "args": { + "External id": 229110,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479159.145, "dur": 0.896, + "args": { + "External id": 229111,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115479165.816, "dur": 1.737, + "args": { + "External id": 229112,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479174.613, "dur": 8.532, + "args": { + "External id": 229113,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479176.512, "dur": 6.320, + "args": { + "External id": 229114,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115479261.695, "dur": 161.265, + "args": { + "External id": 229115,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479263.601, "dur": 2.320, + "args": { + "External id": 229116,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115479267.346, "dur": 155.127, + "args": { + "External id": 229117,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115479268.862, "dur": 0.265, + "args": { + "External id": 229118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115479270.424, "dur": 20.329, + "args": { + "External id": 229119,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115479292.114, "dur": 3.201, + "args": { + "External id": 229120,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479294.440, "dur": 0.680, + "args": { + "External id": 229121,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115479296.158, "dur": 21.802, + "args": { + "External id": 229122,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479297.120, "dur": 1.426, + "args": { + "External id": 229123,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115479299.751, "dur": 17.864, + "args": { + "External id": 229124,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115479303.699, "dur": 2.392, + "args": { + "External id": 229125,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115479319.364, "dur": 17.340, + "args": { + "External id": 229126,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115479338.160, "dur": 11.715, + "args": { + "External id": 229127,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115479352.583, "dur": 13.034, + "args": { + "External id": 229128,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115479366.843, "dur": 10.523, + "args": { + "External id": 229129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115479378.929, "dur": 18.952, + "args": { + "External id": 229130,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115479380.984, "dur": 1.215, + "args": { + "External id": 229131,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479384.563, "dur": 0.975, + "args": { + "External id": 229132,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115479399.531, "dur": 10.597, + "args": { + "External id": 229133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115479411.554, "dur": 10.001, + "args": { + "External id": 229134,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115479428.615, "dur": 1.528, + "args": { + "External id": 229135,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479437.570, "dur": 3.283, + "args": { + "External id": 229136,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479439.654, "dur": 0.437, + "args": { + "External id": 229137,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115479518.301, "dur": 44.014, + "args": { + "External id": 229138,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479567.855, "dur": 5.999, + "args": { + "External id": 229139,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479571.238, "dur": 1.376, + "args": { + "External id": 229140,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115479575.420, "dur": 22.505, + "args": { + "External id": 229141,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115479602.869, "dur": 5.492, + "args": { + "External id": 229142,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115479604.229, "dur": 3.460, + "args": { + "External id": 229143,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479606.187, "dur": 1.315, + "args": { + "External id": 229144,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115479610.580, "dur": 79.317, + "args": { + "External id": 229145,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115479611.772, "dur": 76.752, + "args": { + "External id": 229146,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115479695.526, "dur": 18.761, + "args": { + "External id": 229147,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479720.706, "dur": 5.250, + "args": { + "External id": 229148,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479723.619, "dur": 1.041, + "args": { + "External id": 229149,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115479730.065, "dur": 70.025, + "args": { + "External id": 229150,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115479731.070, "dur": 6.656, + "args": { + "External id": 229151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115479731.970, "dur": 5.146, + "args": { + "External id": 229152,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479733.764, "dur": 3.129, + "args": { + "External id": 229153,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115479750.604, "dur": 49.024, + "args": { + "External id": 229154,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115479751.652, "dur": 47.032, + "args": { + "External id": 229155,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115479804.360, "dur": 4.065, + "args": { + "External id": 229156,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479806.510, "dur": 0.825, + "args": { + "External id": 229157,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115479814.354, "dur": 2.190, + "args": { + "External id": 229158,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479824.048, "dur": 6.520, + "args": { + "External id": 229159,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479826.373, "dur": 3.908, + "args": { + "External id": 229160,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115479922.329, "dur": 184.992, + "args": { + "External id": 229161,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479926.539, "dur": 1.998, + "args": { + "External id": 229162,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115479930.117, "dur": 176.458, + "args": { + "External id": 229163,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115479931.735, "dur": 0.618, + "args": { + "External id": 229164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115479933.428, "dur": 22.136, + "args": { + "External id": 229165,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115479957.110, "dur": 5.179, + "args": { + "External id": 229166,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115479961.038, "dur": 0.964, + "args": { + "External id": 229167,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115479963.042, "dur": 21.125, + "args": { + "External id": 229168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115479964.329, "dur": 1.642, + "args": { + "External id": 229169,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115479967.064, "dur": 16.802, + "args": { + "External id": 229170,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115479969.387, "dur": 2.328, + "args": { + "External id": 229171,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115479985.674, "dur": 21.199, + "args": { + "External id": 229172,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115480008.370, "dur": 13.253, + "args": { + "External id": 229173,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115480024.160, "dur": 14.069, + "args": { + "External id": 229174,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115480039.749, "dur": 13.149, + "args": { + "External id": 229175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115480054.559, "dur": 23.237, + "args": { + "External id": 229176,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115480058.776, "dur": 1.383, + "args": { + "External id": 229177,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480062.668, "dur": 1.343, + "args": { + "External id": 229178,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115480079.480, "dur": 13.058, + "args": { + "External id": 229179,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115480094.034, "dur": 11.388, + "args": { + "External id": 229180,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115480113.339, "dur": 1.640, + "args": { + "External id": 229181,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480122.770, "dur": 3.542, + "args": { + "External id": 229182,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480124.709, "dur": 0.746, + "args": { + "External id": 229183,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115480190.461, "dur": 41.746, + "args": { + "External id": 229184,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480236.996, "dur": 4.540, + "args": { + "External id": 229185,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480239.291, "dur": 1.232, + "args": { + "External id": 229186,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115480242.734, "dur": 23.804, + "args": { + "External id": 229187,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115480271.060, "dur": 5.579, + "args": { + "External id": 229188,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115480272.616, "dur": 3.426, + "args": { + "External id": 229189,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480274.425, "dur": 1.420, + "args": { + "External id": 229190,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115480278.735, "dur": 41.814, + "args": { + "External id": 229191,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115480279.861, "dur": 40.032, + "args": { + "External id": 229192,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115480324.255, "dur": 14.477, + "args": { + "External id": 229193,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480344.005, "dur": 3.761, + "args": { + "External id": 229194,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480346.217, "dur": 0.712, + "args": { + "External id": 229195,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115480351.256, "dur": 47.536, + "args": { + "External id": 229196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115480352.166, "dur": 4.474, + "args": { + "External id": 229197,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115480352.856, "dur": 3.271, + "args": { + "External id": 229198,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480354.658, "dur": 1.346, + "args": { + "External id": 229199,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115480357.228, "dur": 41.281, + "args": { + "External id": 229200,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115480357.904, "dur": 40.026, + "args": { + "External id": 229201,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480402.443, "dur": 3.779, + "args": { + "External id": 229202,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480404.425, "dur": 0.757, + "args": { + "External id": 229203,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115480410.991, "dur": 1.470, + "args": { + "External id": 229204,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115480419.256, "dur": 7.139, + "args": { + "External id": 229205,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115480421.874, "dur": 4.177, + "args": { + "External id": 229206,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115480523.123, "dur": 222.823, + "args": { + "External id": 229207,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115480527.768, "dur": 2.926, + "args": { + "External id": 229208,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115480532.623, "dur": 212.852, + "args": { + "External id": 229209,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115480533.981, "dur": 0.351, + "args": { + "External id": 229210,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115480535.417, "dur": 22.145, + "args": { + "External id": 229211,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115480558.970, "dur": 5.378, + "args": { + "External id": 229212,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480562.821, "dur": 1.251, + "args": { + "External id": 229213,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115480565.313, "dur": 20.587, + "args": { + "External id": 229214,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115480566.275, "dur": 1.244, + "args": { + "External id": 229215,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115480568.689, "dur": 16.950, + "args": { + "External id": 229216,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115480570.941, "dur": 2.206, + "args": { + "External id": 229217,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115480587.387, "dur": 19.502, + "args": { + "External id": 229218,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115480608.324, "dur": 16.319, + "args": { + "External id": 229219,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115480627.456, "dur": 15.669, + "args": { + "External id": 229220,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115480644.349, "dur": 46.385, + "args": { + "External id": 229221,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115480693.937, "dur": 23.907, + "args": { + "External id": 229222,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115480696.085, "dur": 2.091, + "args": { + "External id": 229223,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480700.768, "dur": 0.963, + "args": { + "External id": 229224,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115480719.555, "dur": 12.372, + "args": { + "External id": 229225,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115480733.455, "dur": 11.060, + "args": { + "External id": 229226,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115480753.539, "dur": 2.478, + "args": { + "External id": 229227,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480765.277, "dur": 3.778, + "args": { + "External id": 229228,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480767.646, "dur": 0.631, + "args": { + "External id": 229229,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115480840.201, "dur": 52.632, + "args": { + "External id": 229230,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115480897.346, "dur": 4.200, + "args": { + "External id": 229231,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480899.872, "dur": 0.769, + "args": { + "External id": 229232,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115480903.005, "dur": 28.547, + "args": { + "External id": 229233,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115480936.262, "dur": 6.555, + "args": { + "External id": 229234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115480937.918, "dur": 4.067, + "args": { + "External id": 229235,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115480940.324, "dur": 1.466, + "args": { + "External id": 229236,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115480945.258, "dur": 70.749, + "args": { + "External id": 229237,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115480946.678, "dur": 68.679, + "args": { + "External id": 229238,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115481019.261, "dur": 36.188, + "args": { + "External id": 229239,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481061.072, "dur": 4.108, + "args": { + "External id": 229240,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481063.471, "dur": 0.783, + "args": { + "External id": 229241,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115481068.880, "dur": 60.473, + "args": { + "External id": 229242,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115481069.852, "dur": 4.021, + "args": { + "External id": 229243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115481070.661, "dur": 2.656, + "args": { + "External id": 229244,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481072.519, "dur": 0.654, + "args": { + "External id": 229245,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115481074.604, "dur": 54.417, + "args": { + "External id": 229246,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115481075.353, "dur": 53.044, + "args": { + "External id": 229247,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481133.299, "dur": 3.926, + "args": { + "External id": 229248,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481135.418, "dur": 0.744, + "args": { + "External id": 229249,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115481142.141, "dur": 1.492, + "args": { + "External id": 229250,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481150.620, "dur": 8.101, + "args": { + "External id": 229251,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481152.946, "dur": 5.442, + "args": { + "External id": 229252,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115481235.084, "dur": 162.054, + "args": { + "External id": 229253,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481236.814, "dur": 2.187, + "args": { + "External id": 229254,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115481240.463, "dur": 156.166, + "args": { + "External id": 229255,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115481241.837, "dur": 0.318, + "args": { + "External id": 229256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115481243.530, "dur": 21.105, + "args": { + "External id": 229257,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115481266.162, "dur": 3.708, + "args": { + "External id": 229258,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481268.440, "dur": 1.186, + "args": { + "External id": 229259,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115481270.859, "dur": 21.368, + "args": { + "External id": 229260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481271.704, "dur": 1.757, + "args": { + "External id": 229261,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115481274.537, "dur": 17.254, + "args": { + "External id": 229262,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115481279.097, "dur": 2.244, + "args": { + "External id": 229263,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115481293.682, "dur": 19.037, + "args": { + "External id": 229264,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115481314.106, "dur": 11.638, + "args": { + "External id": 229265,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115481327.859, "dur": 12.636, + "args": { + "External id": 229266,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115481341.599, "dur": 11.139, + "args": { + "External id": 229267,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115481354.343, "dur": 17.818, + "args": { + "External id": 229268,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115481355.783, "dur": 1.238, + "args": { + "External id": 229269,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481359.408, "dur": 0.919, + "args": { + "External id": 229270,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115481373.622, "dur": 10.315, + "args": { + "External id": 229271,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115481384.871, "dur": 10.705, + "args": { + "External id": 229272,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115481402.367, "dur": 1.396, + "args": { + "External id": 229273,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481410.915, "dur": 3.427, + "args": { + "External id": 229274,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481413.186, "dur": 0.403, + "args": { + "External id": 229275,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115481471.191, "dur": 55.472, + "args": { + "External id": 229276,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481543.650, "dur": 8.279, + "args": { + "External id": 229277,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481547.122, "dur": 3.296, + "args": { + "External id": 229278,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115481553.262, "dur": 22.746, + "args": { + "External id": 229279,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115481581.808, "dur": 5.277, + "args": { + "External id": 229280,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115481583.328, "dur": 3.118, + "args": { + "External id": 229281,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481585.352, "dur": 0.914, + "args": { + "External id": 229282,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115481589.562, "dur": 45.373, + "args": { + "External id": 229283,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115481590.825, "dur": 43.405, + "args": { + "External id": 229284,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115481638.424, "dur": 47.488, + "args": { + "External id": 229285,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481694.312, "dur": 5.446, + "args": { + "External id": 229286,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481697.170, "dur": 1.098, + "args": { + "External id": 229287,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115481704.046, "dur": 53.507, + "args": { + "External id": 229288,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115481705.102, "dur": 4.243, + "args": { + "External id": 229289,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115481705.964, "dur": 2.818, + "args": { + "External id": 229290,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481707.820, "dur": 0.821, + "args": { + "External id": 229291,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115481710.153, "dur": 47.049, + "args": { + "External id": 229292,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115481711.158, "dur": 45.270, + "args": { + "External id": 229293,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115481761.432, "dur": 4.183, + "args": { + "External id": 229294,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481763.537, "dur": 0.892, + "args": { + "External id": 229295,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115481772.032, "dur": 1.864, + "args": { + "External id": 229296,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481781.577, "dur": 7.095, + "args": { + "External id": 229297,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481783.783, "dur": 4.631, + "args": { + "External id": 229298,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115481881.370, "dur": 186.244, + "args": { + "External id": 229299,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481883.901, "dur": 4.370, + "args": { + "External id": 229300,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115481889.913, "dur": 177.138, + "args": { + "External id": 229301,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115481891.737, "dur": 0.494, + "args": { + "External id": 229302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115481893.427, "dur": 22.177, + "args": { + "External id": 229303,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115481917.317, "dur": 5.801, + "args": { + "External id": 229304,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115481922.146, "dur": 0.723, + "args": { + "External id": 229305,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115481924.128, "dur": 20.080, + "args": { + "External id": 229306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115481924.971, "dur": 1.692, + "args": { + "External id": 229307,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115481927.741, "dur": 16.157, + "args": { + "External id": 229308,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115481930.523, "dur": 2.569, + "args": { + "External id": 229309,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115481945.883, "dur": 19.157, + "args": { + "External id": 229310,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115481966.529, "dur": 12.762, + "args": { + "External id": 229311,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115481982.016, "dur": 22.850, + "args": { + "External id": 229312,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115482006.439, "dur": 11.588, + "args": { + "External id": 229313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115482019.646, "dur": 21.313, + "args": { + "External id": 229314,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115482021.887, "dur": 1.500, + "args": { + "External id": 229315,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482025.770, "dur": 2.746, + "args": { + "External id": 229316,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115482042.950, "dur": 11.317, + "args": { + "External id": 229317,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115482055.296, "dur": 10.546, + "args": { + "External id": 229318,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115482073.698, "dur": 1.914, + "args": { + "External id": 229319,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482084.218, "dur": 3.305, + "args": { + "External id": 229320,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482086.276, "dur": 0.409, + "args": { + "External id": 229321,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115482151.784, "dur": 40.591, + "args": { + "External id": 229322,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482196.666, "dur": 5.411, + "args": { + "External id": 229323,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482199.759, "dur": 1.306, + "args": { + "External id": 229324,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115482203.319, "dur": 20.310, + "args": { + "External id": 229325,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115482228.195, "dur": 5.958, + "args": { + "External id": 229326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115482229.975, "dur": 3.388, + "args": { + "External id": 229327,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482231.714, "dur": 1.471, + "args": { + "External id": 229328,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115482236.418, "dur": 40.237, + "args": { + "External id": 229329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115482237.602, "dur": 38.522, + "args": { + "External id": 229330,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115482279.826, "dur": 13.207, + "args": { + "External id": 229331,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115482297.413, "dur": 23.703, + "args": { + "External id": 229332,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115482299.862, "dur": 20.821, + "args": { + "External id": 229333,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482304.960, "dur": 0.999, + "args": { + "External id": 229334,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115482325.868, "dur": 25.059, + "args": { + "External id": 229335,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115482327.677, "dur": 23.045, + "args": { + "External id": 229336,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 8135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482331.949, "dur": 3.797, + "args": { + "External id": 229337,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115482336.845, "dur": 13.298, + "args": { + "External id": 229338,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115482363.031, "dur": 4.941, + "args": { + "External id": 229339,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115482365.061, "dur": 2.687, + "args": { + "External id": 229340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115482369.074, "dur": 1.414, + "args": { + "External id": 229341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115482369.937, "dur": 0.476, + "args": { + "External id": 229342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115482412.236, "dur": 22.499, + "args": { + "External id": 229343,"Sequence number": 2757948, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115482436.978, "dur": 14.890, + "args": { + "External id": 229344,"Sequence number": 2757949, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8143 + } + }, + { + "ph": "s", "id": 9, "pid": 4183442, "tid": 4183442, "ts": 667115482436.978, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482457.396, "dur": 5.529, + "args": { + "External id": 229345,"Sequence number": 2757950, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 8144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482460.629, "dur": 0.971, + "args": { + "External id": 229346,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115482465.334, "dur": 7.003, + "args": { + "External id": 229347,"Sequence number": 2757950, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "3"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 8146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482469.918, "dur": 1.161, + "args": { + "External id": 229348,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482473.640, "dur": 3.360, + "args": { + "External id": 229349,"Sequence number": 2757950, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 8148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482475.408, "dur": 0.994, + "args": { + "External id": 229350,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 8149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482481.086, "dur": 7.285, + "args": { + "External id": 229351,"Sequence number": 2757950, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 8150 + } + }, + { + "ph": "s", "id": 8, "pid": 4183442, "tid": 4183442, "ts": 667115482481.086, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482486.162, "dur": 0.984, + "args": { + "External id": 229352,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482489.522, "dur": 24.795, + "args": { + "External id": 229353,"Sequence number": 2757951, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 8152 + } + }, + { + "ph": "s", "id": 7, "pid": 4183442, "tid": 4183442, "ts": 667115482489.522, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482511.851, "dur": 0.836, + "args": { + "External id": 229354,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183442, "tid": 4183442, + "ts": 667115482515.917, "dur": 5.586, + "args": { + "External id": 229355,"Sequence number": 2757952, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 8154 + } + }, + { + "ph": "s", "id": 6, "pid": 4183442, "tid": 4183442, "ts": 667115482515.917, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482519.770, "dur": 0.837, + "args": { + "External id": 229356,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115482522.674, "dur": 5.186, + "args": { + "External id": 229357,"Sequence number": 2757953, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 8156 + } + }, + { + "ph": "s", "id": 5, "pid": 4183442, "tid": 4183442, "ts": 667115482522.674, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482525.781, "dur": 1.322, + "args": { + "External id": 229358,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 8157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115482532.326, "dur": 33.398, + "args": { + "External id": 229359,"Sequence number": 2757954, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115482533.977, "dur": 31.464, + "args": { + "External id": 229360,"Sequence number": 2757954, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482536.603, "dur": 6.568, + "args": { + "External id": 229361,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 8160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115482539.023, "dur": 3.639, + "args": { + "External id": 229362,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115482544.104, "dur": 20.786, + "args": { + "External id": 229363,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 8162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115482591.892, "dur": 6.331, + "args": { + "External id": 229364,"Sequence number": 2757954, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 8163 + } + }, + { + "ph": "s", "id": 4, "pid": 4183442, "tid": 4183442, "ts": 667115482591.892, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115482600.578, "dur": 1.357, + "args": { + "External id": 229365,"Sequence number": 2757955, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183442, "tid": 4183442, + "ts": 667115482633.507, "dur": 23083.083, + "args": { + "External id": 229366,"Sequence number": 2757955, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 8165 + } + }, + { + "ph": "s", "id": 3, "pid": 4183442, "tid": 4183442, "ts": 667115482633.507, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183442, "tid": 4183442, + "ts": 667115482647.733, "dur": 70.943, + "args": { + "External id": 229367,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115482648.566, "dur": 69.881, + "args": { + "External id": 229368,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482650.164, "dur": 43.632, + "args": { + "External id": 229369,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115482687.236, "dur": 5.783, + "args": { + "External id": 229370,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115482694.655, "dur": 23.392, + "args": { + "External id": 229371,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 8170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482736.009, "dur": 28.570, + "args": { + "External id": 229372,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482737.391, "dur": 6.736, + "args": { + "External id": 229373,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482739.827, "dur": 3.940, + "args": { + "External id": 229374,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115482745.417, "dur": 18.943, + "args": { + "External id": 229375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115482747.339, "dur": 16.501, + "args": { + "External id": 229376,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482795.714, "dur": 18.990, + "args": { + "External id": 229377,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115482796.367, "dur": 4.894, + "args": { + "External id": 229378,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482798.240, "dur": 2.791, + "args": { + "External id": 229379,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115482801.823, "dur": 12.687, + "args": { + "External id": 229380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115482802.198, "dur": 11.883, + "args": { + "External id": 229381,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 8180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115482821.104, "dur": 18.017, + "args": { + "External id": 229382,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115482824.916, "dur": 2.750, + "args": { + "External id": 229383,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115482828.234, "dur": 10.619, + "args": { + "External id": 229384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 8183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115482828.801, "dur": 9.648, + "args": { + "External id": 229385,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 4183442, + "ts": 667115482844.154, "dur": 21.928, + "args": { + "External id": 229386,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115482868.888, "dur": 50.718, + "args": { + "External id": 229387,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115482870.862, "dur": 48.258, + "args": { + "External id": 229388,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482875.639, "dur": 1.115, + "args": { + "External id": 229389,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115482878.191, "dur": 23.942, + "args": { + "External id": 229390,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115482879.812, "dur": 22.121, + "args": { + "External id": 229391,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 8190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115482883.793, "dur": 2.251, + "args": { + "External id": 229392,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115482886.725, "dur": 14.839, + "args": { + "External id": 229393,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 8192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115482923.513, "dur": 17376.544, + "args": { + "External id": 229394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115482924.793, "dur": 17373.808, + "args": { + "External id": 229395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115500311.420, "dur": 8.299, + "args": { + "External id": 229396,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500316.860, "dur": 0.901, + "args": { + "External id": 229397,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115500324.573, "dur": 103.090, + "args": { + "External id": 229398,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115500326.180, "dur": 7.245, + "args": { + "External id": 229399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115500328.519, "dur": 3.937, + "args": { + "External id": 229400,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500330.907, "dur": 1.234, + "args": { + "External id": 229401,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115500334.613, "dur": 92.402, + "args": { + "External id": 229402,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115500336.144, "dur": 89.730, + "args": { + "External id": 229403,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115500431.369, "dur": 4.676, + "args": { + "External id": 229404,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500433.547, "dur": 0.865, + "args": { + "External id": 229405,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115500442.733, "dur": 2.826, + "args": { + "External id": 229406,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115500458.523, "dur": 6.807, + "args": { + "External id": 229407,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115500460.914, "dur": 4.131, + "args": { + "External id": 229408,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115500600.199, "dur": 239.157, + "args": { + "External id": 229409,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115500605.270, "dur": 2.869, + "args": { + "External id": 229410,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115500610.207, "dur": 228.680, + "args": { + "External id": 229411,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115500612.151, "dur": 0.648, + "args": { + "External id": 229412,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115500614.551, "dur": 27.475, + "args": { + "External id": 229413,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115500643.673, "dur": 6.154, + "args": { + "External id": 229414,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500648.305, "dur": 1.148, + "args": { + "External id": 229415,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115500651.078, "dur": 55.508, + "args": { + "External id": 229416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115500679.867, "dur": 2.733, + "args": { + "External id": 229417,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115500684.162, "dur": 22.131, + "args": { + "External id": 229418,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115500688.083, "dur": 3.342, + "args": { + "External id": 229419,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115500708.566, "dur": 23.760, + "args": { + "External id": 229420,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115500734.150, "dur": 18.508, + "args": { + "External id": 229421,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115500755.541, "dur": 15.826, + "args": { + "External id": 229422,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115500773.125, "dur": 14.401, + "args": { + "External id": 229423,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115500789.353, "dur": 22.831, + "args": { + "External id": 229424,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115500791.891, "dur": 1.768, + "args": { + "External id": 229425,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500796.211, "dur": 0.962, + "args": { + "External id": 229426,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115500813.818, "dur": 12.387, + "args": { + "External id": 229427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115500827.566, "dur": 10.310, + "args": { + "External id": 229428,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115500847.446, "dur": 2.474, + "args": { + "External id": 229429,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115500857.219, "dur": 4.443, + "args": { + "External id": 229430,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115500859.840, "dur": 0.890, + "args": { + "External id": 229431,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115500935.831, "dur": 54.568, + "args": { + "External id": 229432,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115500995.779, "dur": 14.138, + "args": { + "External id": 229433,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501005.351, "dur": 1.762, + "args": { + "External id": 229434,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115501011.881, "dur": 25.465, + "args": { + "External id": 229435,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115501042.529, "dur": 9.718, + "args": { + "External id": 229436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115501044.446, "dur": 6.974, + "args": { + "External id": 229437,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501046.910, "dur": 4.221, + "args": { + "External id": 229438,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115501055.173, "dur": 44.919, + "args": { + "External id": 229439,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115501056.376, "dur": 43.016, + "args": { + "External id": 229440,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115501104.501, "dur": 14.147, + "args": { + "External id": 229441,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501124.308, "dur": 4.086, + "args": { + "External id": 229442,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501126.680, "dur": 0.796, + "args": { + "External id": 229443,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115501132.624, "dur": 47.684, + "args": { + "External id": 229444,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115501133.927, "dur": 4.128, + "args": { + "External id": 229445,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115501134.719, "dur": 2.639, + "args": { + "External id": 229446,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501136.273, "dur": 0.734, + "args": { + "External id": 229447,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115501138.713, "dur": 41.225, + "args": { + "External id": 229448,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115501139.515, "dur": 39.844, + "args": { + "External id": 229449,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501184.644, "dur": 4.021, + "args": { + "External id": 229450,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501186.523, "dur": 0.608, + "args": { + "External id": 229451,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115501194.676, "dur": 1.571, + "args": { + "External id": 229452,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501203.906, "dur": 6.854, + "args": { + "External id": 229453,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501206.048, "dur": 4.439, + "args": { + "External id": 229454,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115501296.396, "dur": 170.092, + "args": { + "External id": 229455,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501298.734, "dur": 2.282, + "args": { + "External id": 229456,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115501304.722, "dur": 161.180, + "args": { + "External id": 229457,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115501306.258, "dur": 0.513, + "args": { + "External id": 229458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115501308.148, "dur": 19.289, + "args": { + "External id": 229459,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115501328.868, "dur": 5.323, + "args": { + "External id": 229460,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501331.235, "dur": 2.706, + "args": { + "External id": 229461,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115501334.998, "dur": 21.255, + "args": { + "External id": 229462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501336.440, "dur": 1.697, + "args": { + "External id": 229463,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115501339.310, "dur": 16.684, + "args": { + "External id": 229464,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115501341.611, "dur": 2.729, + "args": { + "External id": 229465,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115501357.780, "dur": 18.999, + "args": { + "External id": 229466,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115501378.211, "dur": 11.727, + "args": { + "External id": 229467,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115501392.444, "dur": 13.789, + "args": { + "External id": 229468,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115501407.462, "dur": 11.728, + "args": { + "External id": 229469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115501420.769, "dur": 19.720, + "args": { + "External id": 229470,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115501422.929, "dur": 1.670, + "args": { + "External id": 229471,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501426.959, "dur": 0.708, + "args": { + "External id": 229472,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115501441.983, "dur": 10.666, + "args": { + "External id": 229473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115501453.642, "dur": 11.458, + "args": { + "External id": 229474,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115501472.723, "dur": 1.740, + "args": { + "External id": 229475,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501482.581, "dur": 3.660, + "args": { + "External id": 229476,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501484.863, "dur": 0.505, + "args": { + "External id": 229477,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115501582.307, "dur": 53.920, + "args": { + "External id": 229478,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501641.890, "dur": 7.806, + "args": { + "External id": 229479,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501644.971, "dur": 3.098, + "args": { + "External id": 229480,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115501684.073, "dur": 29.050, + "args": { + "External id": 229481,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115501728.456, "dur": 7.377, + "args": { + "External id": 229482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115501731.749, "dur": 3.056, + "args": { + "External id": 229483,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501733.689, "dur": 0.885, + "args": { + "External id": 229484,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115501738.995, "dur": 52.264, + "args": { + "External id": 229485,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115501740.316, "dur": 50.302, + "args": { + "External id": 229486,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115501795.323, "dur": 16.102, + "args": { + "External id": 229487,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501818.021, "dur": 4.424, + "args": { + "External id": 229488,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501820.652, "dur": 0.771, + "args": { + "External id": 229489,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115501826.754, "dur": 49.514, + "args": { + "External id": 229490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115501827.893, "dur": 4.603, + "args": { + "External id": 229491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115501828.998, "dur": 2.923, + "args": { + "External id": 229492,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501830.711, "dur": 1.008, + "args": { + "External id": 229493,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115501833.050, "dur": 42.786, + "args": { + "External id": 229494,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115501833.674, "dur": 41.621, + "args": { + "External id": 229495,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115501880.310, "dur": 3.916, + "args": { + "External id": 229496,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115501882.283, "dur": 0.838, + "args": { + "External id": 229497,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115501890.423, "dur": 2.033, + "args": { + "External id": 229498,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501900.169, "dur": 8.620, + "args": { + "External id": 229499,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501902.408, "dur": 5.998, + "args": { + "External id": 229500,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115501997.067, "dur": 183.422, + "args": { + "External id": 229501,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115501999.264, "dur": 2.341, + "args": { + "External id": 229502,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115502003.259, "dur": 176.750, + "args": { + "External id": 229503,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115502004.965, "dur": 0.388, + "args": { + "External id": 229504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115502006.678, "dur": 24.328, + "args": { + "External id": 229505,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115502032.775, "dur": 3.297, + "args": { + "External id": 229506,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502035.153, "dur": 0.738, + "args": { + "External id": 229507,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115502036.929, "dur": 22.889, + "args": { + "External id": 229508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115502038.267, "dur": 2.150, + "args": { + "External id": 229509,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115502041.682, "dur": 17.863, + "args": { + "External id": 229510,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115502046.575, "dur": 2.332, + "args": { + "External id": 229511,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115502064.307, "dur": 19.150, + "args": { + "External id": 229512,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115502084.796, "dur": 12.889, + "args": { + "External id": 229513,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115502100.174, "dur": 13.635, + "args": { + "External id": 229514,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115502115.379, "dur": 13.286, + "args": { + "External id": 229515,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115502130.371, "dur": 20.981, + "args": { + "External id": 229516,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115502132.491, "dur": 1.857, + "args": { + "External id": 229517,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502136.533, "dur": 0.773, + "args": { + "External id": 229518,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115502153.075, "dur": 13.934, + "args": { + "External id": 229519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115502168.256, "dur": 10.729, + "args": { + "External id": 229520,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115502187.091, "dur": 2.050, + "args": { + "External id": 229521,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502197.966, "dur": 3.556, + "args": { + "External id": 229522,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502200.234, "dur": 0.414, + "args": { + "External id": 229523,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115502263.384, "dur": 40.633, + "args": { + "External id": 229524,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502308.416, "dur": 6.395, + "args": { + "External id": 229525,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502310.746, "dur": 3.058, + "args": { + "External id": 229526,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115502316.212, "dur": 20.976, + "args": { + "External id": 229527,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115502341.891, "dur": 5.489, + "args": { + "External id": 229528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115502343.296, "dur": 3.387, + "args": { + "External id": 229529,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502345.588, "dur": 0.905, + "args": { + "External id": 229530,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115502349.614, "dur": 41.156, + "args": { + "External id": 229531,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115502350.267, "dur": 39.893, + "args": { + "External id": 229532,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115502394.447, "dur": 14.684, + "args": { + "External id": 229533,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502414.591, "dur": 4.087, + "args": { + "External id": 229534,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502416.867, "dur": 1.010, + "args": { + "External id": 229535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115502422.087, "dur": 50.220, + "args": { + "External id": 229536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115502423.062, "dur": 3.485, + "args": { + "External id": 229537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115502423.752, "dur": 2.250, + "args": { + "External id": 229538,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502425.120, "dur": 0.731, + "args": { + "External id": 229539,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115502427.084, "dur": 44.887, + "args": { + "External id": 229540,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115502427.715, "dur": 43.625, + "args": { + "External id": 229541,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502476.351, "dur": 3.571, + "args": { + "External id": 229542,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502478.009, "dur": 0.950, + "args": { + "External id": 229543,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115502484.957, "dur": 1.500, + "args": { + "External id": 229544,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115502511.632, "dur": 8.541, + "args": { + "External id": 229545,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115502514.035, "dur": 5.663, + "args": { + "External id": 229546,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115502605.575, "dur": 222.440, + "args": { + "External id": 229547,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115502607.262, "dur": 4.523, + "args": { + "External id": 229548,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115502613.296, "dur": 214.131, + "args": { + "External id": 229549,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115502614.532, "dur": 0.347, + "args": { + "External id": 229550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115502616.628, "dur": 21.454, + "args": { + "External id": 229551,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115502639.698, "dur": 6.419, + "args": { + "External id": 229552,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502644.327, "dur": 1.523, + "args": { + "External id": 229553,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115502647.094, "dur": 58.237, + "args": { + "External id": 229554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115502648.154, "dur": 1.403, + "args": { + "External id": 229555,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115502650.714, "dur": 54.144, + "args": { + "External id": 229556,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115502687.207, "dur": 3.276, + "args": { + "External id": 229557,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115502706.902, "dur": 21.313, + "args": { + "External id": 229558,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115502729.597, "dur": 13.939, + "args": { + "External id": 229559,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115502746.520, "dur": 14.607, + "args": { + "External id": 229560,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115502762.446, "dur": 12.473, + "args": { + "External id": 229561,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115502776.638, "dur": 24.016, + "args": { + "External id": 229562,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115502780.728, "dur": 1.807, + "args": { + "External id": 229563,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502785.252, "dur": 0.953, + "args": { + "External id": 229564,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115502802.311, "dur": 12.237, + "args": { + "External id": 229565,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115502815.966, "dur": 10.261, + "args": { + "External id": 229566,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115502835.560, "dur": 2.745, + "args": { + "External id": 229567,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502847.540, "dur": 3.868, + "args": { + "External id": 229568,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502849.906, "dur": 0.684, + "args": { + "External id": 229569,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115502914.607, "dur": 46.740, + "args": { + "External id": 229570,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115502966.362, "dur": 4.257, + "args": { + "External id": 229571,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115502968.982, "dur": 0.680, + "args": { + "External id": 229572,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115502972.025, "dur": 21.491, + "args": { + "External id": 229573,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115502998.070, "dur": 6.118, + "args": { + "External id": 229574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115502999.678, "dur": 3.793, + "args": { + "External id": 229575,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503001.800, "dur": 1.474, + "args": { + "External id": 229576,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115503006.997, "dur": 41.296, + "args": { + "External id": 229577,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115503008.018, "dur": 39.565, + "args": { + "External id": 229578,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115503051.855, "dur": 13.457, + "args": { + "External id": 229579,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503070.959, "dur": 4.006, + "args": { + "External id": 229580,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503073.443, "dur": 0.804, + "args": { + "External id": 229581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115503078.525, "dur": 46.131, + "args": { + "External id": 229582,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115503079.549, "dur": 3.818, + "args": { + "External id": 229583,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115503080.131, "dur": 2.664, + "args": { + "External id": 229584,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503081.942, "dur": 0.701, + "args": { + "External id": 229585,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115503083.921, "dur": 40.362, + "args": { + "External id": 229586,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115503084.635, "dur": 39.069, + "args": { + "External id": 229587,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503128.747, "dur": 4.208, + "args": { + "External id": 229588,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503130.825, "dur": 0.972, + "args": { + "External id": 229589,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115503137.660, "dur": 1.387, + "args": { + "External id": 229590,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503146.481, "dur": 6.306, + "args": { + "External id": 229591,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503149.019, "dur": 3.504, + "args": { + "External id": 229592,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115503224.602, "dur": 170.771, + "args": { + "External id": 229593,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503228.333, "dur": 2.252, + "args": { + "External id": 229594,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115503232.133, "dur": 162.733, + "args": { + "External id": 229595,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115503233.160, "dur": 0.512, + "args": { + "External id": 229596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115503235.206, "dur": 20.362, + "args": { + "External id": 229597,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115503257.137, "dur": 4.691, + "args": { + "External id": 229598,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503260.550, "dur": 1.098, + "args": { + "External id": 229599,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115503262.718, "dur": 18.837, + "args": { + "External id": 229600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503263.920, "dur": 1.516, + "args": { + "External id": 229601,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115503266.598, "dur": 14.699, + "args": { + "External id": 229602,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115503268.802, "dur": 2.332, + "args": { + "External id": 229603,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115503282.819, "dur": 18.834, + "args": { + "External id": 229604,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115503303.062, "dur": 15.877, + "args": { + "External id": 229605,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115503321.506, "dur": 12.973, + "args": { + "External id": 229606,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115503335.662, "dur": 10.463, + "args": { + "External id": 229607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115503347.633, "dur": 17.364, + "args": { + "External id": 229608,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115503349.266, "dur": 1.535, + "args": { + "External id": 229609,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503352.943, "dur": 0.789, + "args": { + "External id": 229610,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115503366.796, "dur": 15.536, + "args": { + "External id": 229611,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115503383.336, "dur": 10.539, + "args": { + "External id": 229612,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115503400.743, "dur": 1.292, + "args": { + "External id": 229613,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503409.790, "dur": 3.175, + "args": { + "External id": 229614,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503411.777, "dur": 0.450, + "args": { + "External id": 229615,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115503467.822, "dur": 54.185, + "args": { + "External id": 229616,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503527.932, "dur": 6.243, + "args": { + "External id": 229617,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503531.275, "dur": 1.207, + "args": { + "External id": 229618,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115503535.249, "dur": 21.358, + "args": { + "External id": 229619,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115503561.306, "dur": 5.892, + "args": { + "External id": 229620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115503562.611, "dur": 3.694, + "args": { + "External id": 229621,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503565.004, "dur": 1.110, + "args": { + "External id": 229622,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115503569.697, "dur": 45.299, + "args": { + "External id": 229623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115503571.114, "dur": 43.176, + "args": { + "External id": 229624,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115503618.585, "dur": 14.806, + "args": { + "External id": 229625,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503638.981, "dur": 4.357, + "args": { + "External id": 229626,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503641.531, "dur": 0.923, + "args": { + "External id": 229627,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115503647.001, "dur": 87.527, + "args": { + "External id": 229628,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115503647.928, "dur": 36.874, + "args": { + "External id": 229629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115503648.995, "dur": 34.969, + "args": { + "External id": 229630,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503682.140, "dur": 1.179, + "args": { + "External id": 229631,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115503686.119, "dur": 47.913, + "args": { + "External id": 229632,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115503687.344, "dur": 45.959, + "args": { + "External id": 229633,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115503740.130, "dur": 4.396, + "args": { + "External id": 229634,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503742.597, "dur": 0.710, + "args": { + "External id": 229635,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115503750.801, "dur": 1.586, + "args": { + "External id": 229636,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503759.433, "dur": 9.530, + "args": { + "External id": 229637,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503762.237, "dur": 6.436, + "args": { + "External id": 229638,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115503850.020, "dur": 181.276, + "args": { + "External id": 229639,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503851.906, "dur": 2.281, + "args": { + "External id": 229640,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115503855.616, "dur": 175.010, + "args": { + "External id": 229641,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115503857.114, "dur": 0.473, + "args": { + "External id": 229642,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115503858.702, "dur": 24.736, + "args": { + "External id": 229643,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115503885.113, "dur": 3.447, + "args": { + "External id": 229644,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503887.343, "dur": 0.971, + "args": { + "External id": 229645,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115503889.510, "dur": 24.235, + "args": { + "External id": 229646,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115503890.857, "dur": 1.532, + "args": { + "External id": 229647,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115503893.794, "dur": 19.637, + "args": { + "External id": 229648,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115503898.763, "dur": 2.290, + "args": { + "External id": 229649,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115503915.204, "dur": 20.676, + "args": { + "External id": 229650,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115503937.554, "dur": 12.893, + "args": { + "External id": 229651,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115503952.946, "dur": 14.612, + "args": { + "External id": 229652,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115503968.964, "dur": 12.715, + "args": { + "External id": 229653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115503983.744, "dur": 20.690, + "args": { + "External id": 229654,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115503985.490, "dur": 1.965, + "args": { + "External id": 229655,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115503989.534, "dur": 0.987, + "args": { + "External id": 229656,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115504005.855, "dur": 11.704, + "args": { + "External id": 229657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115504018.672, "dur": 10.721, + "args": { + "External id": 229658,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115504036.562, "dur": 1.378, + "args": { + "External id": 229659,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504059.973, "dur": 3.337, + "args": { + "External id": 229660,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504062.013, "dur": 0.549, + "args": { + "External id": 229661,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115504123.334, "dur": 44.984, + "args": { + "External id": 229662,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504173.057, "dur": 6.719, + "args": { + "External id": 229663,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504175.861, "dur": 2.843, + "args": { + "External id": 229664,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115504181.016, "dur": 24.246, + "args": { + "External id": 229665,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115504209.294, "dur": 5.693, + "args": { + "External id": 229666,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115504210.896, "dur": 3.342, + "args": { + "External id": 229667,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504213.093, "dur": 0.735, + "args": { + "External id": 229668,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115504217.275, "dur": 43.000, + "args": { + "External id": 229669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115504218.448, "dur": 41.152, + "args": { + "External id": 229670,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115504263.662, "dur": 15.265, + "args": { + "External id": 229671,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504284.331, "dur": 4.265, + "args": { + "External id": 229672,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504286.764, "dur": 0.952, + "args": { + "External id": 229673,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115504292.046, "dur": 48.601, + "args": { + "External id": 229674,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115504293.258, "dur": 3.849, + "args": { + "External id": 229675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115504294.005, "dur": 2.532, + "args": { + "External id": 229676,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504295.736, "dur": 0.446, + "args": { + "External id": 229677,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115504297.811, "dur": 42.504, + "args": { + "External id": 229678,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115504298.577, "dur": 41.156, + "args": { + "External id": 229679,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504344.425, "dur": 3.941, + "args": { + "External id": 229680,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504346.420, "dur": 0.975, + "args": { + "External id": 229681,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115504353.192, "dur": 1.316, + "args": { + "External id": 229682,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115504360.948, "dur": 6.010, + "args": { + "External id": 229683,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115504362.696, "dur": 3.912, + "args": { + "External id": 229684,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115504441.001, "dur": 304.527, + "args": { + "External id": 229685,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115504443.159, "dur": 4.053, + "args": { + "External id": 229686,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115504448.628, "dur": 296.362, + "args": { + "External id": 229687,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115504449.949, "dur": 0.643, + "args": { + "External id": 229688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115504451.857, "dur": 26.405, + "args": { + "External id": 229689,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115504479.895, "dur": 5.195, + "args": { + "External id": 229690,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504484.178, "dur": 0.763, + "args": { + "External id": 229691,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115504485.895, "dur": 42.968, + "args": { + "External id": 229692,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115504486.917, "dur": 1.559, + "args": { + "External id": 229693,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115504489.523, "dur": 39.019, + "args": { + "External id": 229694,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115504509.624, "dur": 3.237, + "args": { + "External id": 229695,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115504530.469, "dur": 38.681, + "args": { + "External id": 229696,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115504570.622, "dur": 37.335, + "args": { + "External id": 229697,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115504610.430, "dur": 26.745, + "args": { + "External id": 229698,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115504638.835, "dur": 45.563, + "args": { + "External id": 229699,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115504687.424, "dur": 27.921, + "args": { + "External id": 229700,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115504692.041, "dur": 1.885, + "args": { + "External id": 229701,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504696.392, "dur": 0.903, + "args": { + "External id": 229702,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115504717.456, "dur": 13.341, + "args": { + "External id": 229703,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115504731.934, "dur": 11.538, + "args": { + "External id": 229704,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115504752.574, "dur": 2.519, + "args": { + "External id": 229705,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504765.299, "dur": 3.764, + "args": { + "External id": 229706,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504767.742, "dur": 0.411, + "args": { + "External id": 229707,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115504837.723, "dur": 48.131, + "args": { + "External id": 229708,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115504890.483, "dur": 4.979, + "args": { + "External id": 229709,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504893.290, "dur": 1.177, + "args": { + "External id": 229710,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115504896.879, "dur": 22.997, + "args": { + "External id": 229711,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115504924.721, "dur": 6.596, + "args": { + "External id": 229712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115504926.658, "dur": 3.920, + "args": { + "External id": 229713,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115504928.824, "dur": 1.528, + "args": { + "External id": 229714,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115504933.883, "dur": 43.826, + "args": { + "External id": 229715,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115504935.544, "dur": 41.539, + "args": { + "External id": 229716,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115504981.532, "dur": 13.585, + "args": { + "External id": 229717,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115505000.723, "dur": 4.306, + "args": { + "External id": 229718,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505003.354, "dur": 0.892, + "args": { + "External id": 229719,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183442, "tid": 4183442, + "ts": 667115505008.886, "dur": 47.327, + "args": { + "External id": 229720,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115505010.094, "dur": 3.884, + "args": { + "External id": 229721,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115505011.184, "dur": 2.232, + "args": { + "External id": 229722,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505012.634, "dur": 0.648, + "args": { + "External id": 229723,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115505014.676, "dur": 41.191, + "args": { + "External id": 229724,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115505016.111, "dur": 39.128, + "args": { + "External id": 229725,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115505060.091, "dur": 4.351, + "args": { + "External id": 229726,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505062.178, "dur": 1.051, + "args": { + "External id": 229727,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115505069.800, "dur": 1.282, + "args": { + "External id": 229728,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183442, "tid": 4183442, + "ts": 667115505078.241, "dur": 6.325, + "args": { + "External id": 229729,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115505080.368, "dur": 3.878, + "args": { + "External id": 229730,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115505158.797, "dur": 168.076, + "args": { + "External id": 229731,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115505162.794, "dur": 2.418, + "args": { + "External id": 229732,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183442, "tid": 4183442, + "ts": 667115505166.781, "dur": 159.691, + "args": { + "External id": 229733,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183442, "tid": 4183442, + "ts": 667115505168.207, "dur": 0.497, + "args": { + "External id": 229734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183442, "tid": 4183442, + "ts": 667115505170.162, "dur": 19.096, + "args": { + "External id": 229735,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183442, "tid": 4183442, + "ts": 667115505190.802, "dur": 5.116, + "args": { + "External id": 229736,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505194.450, "dur": 1.270, + "args": { + "External id": 229737,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115505196.910, "dur": 20.631, + "args": { + "External id": 229738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115505197.952, "dur": 1.457, + "args": { + "External id": 229739,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115505200.860, "dur": 16.435, + "args": { + "External id": 229740,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115505203.150, "dur": 2.175, + "args": { + "External id": 229741,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115505219.157, "dur": 20.288, + "args": { + "External id": 229742,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115505241.123, "dur": 13.691, + "args": { + "External id": 229743,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183442, "tid": 4183442, + "ts": 667115505257.390, "dur": 12.844, + "args": { + "External id": 229744,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183442, "tid": 4183442, + "ts": 667115505271.744, "dur": 10.456, + "args": { + "External id": 229745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115505283.780, "dur": 17.691, + "args": { + "External id": 229746,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115505285.725, "dur": 1.533, + "args": { + "External id": 229747,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505289.455, "dur": 0.896, + "args": { + "External id": 229748,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183442, "tid": 4183442, + "ts": 667115505303.107, "dur": 11.069, + "args": { + "External id": 229749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115505315.464, "dur": 10.033, + "args": { + "External id": 229750,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115505332.192, "dur": 1.553, + "args": { + "External id": 229751,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115505340.802, "dur": 3.467, + "args": { + "External id": 229752,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505343.103, "dur": 0.322, + "args": { + "External id": 229753,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115505403.226, "dur": 38.783, + "args": { + "External id": 229754,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183442, "tid": 4183442, + "ts": 667115505446.262, "dur": 12.874, + "args": { + "External id": 229755,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505457.028, "dur": 1.003, + "args": { + "External id": 229756,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115505460.468, "dur": 20.947, + "args": { + "External id": 229757,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183442, "tid": 4183442, + "ts": 667115505485.469, "dur": 25.726, + "args": { + "External id": 229758,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183442, "tid": 4183442, + "ts": 667115505486.989, "dur": 23.009, + "args": { + "External id": 229759,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505488.770, "dur": 20.545, + "args": { + "External id": 229760,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183442, "tid": 4183442, + "ts": 667115505515.206, "dur": 46.661, + "args": { + "External id": 229761,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183442, "tid": 4183442, + "ts": 667115505516.532, "dur": 44.632, + "args": { + "External id": 229762,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115505565.574, "dur": 14.332, + "args": { + "External id": 229763,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115505584.965, "dur": 24.581, + "args": { + "External id": 229764,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183442, "tid": 4183442, + "ts": 667115505587.126, "dur": 22.060, + "args": { + "External id": 229765,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505592.952, "dur": 1.662, + "args": { + "External id": 229766,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115505614.865, "dur": 24.716, + "args": { + "External id": 229767,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183442, "tid": 4183442, + "ts": 667115505616.590, "dur": 22.784, + "args": { + "External id": 229768,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 8567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115505621.496, "dur": 3.649, + "args": { + "External id": 229769,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115505626.242, "dur": 12.649, + "args": { + "External id": 229770,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115505683.482, "dur": 5.744, + "args": { + "External id": 229771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115505685.425, "dur": 3.348, + "args": { + "External id": 229772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183442, "tid": 4183442, + "ts": 667115505690.784, "dur": 1.719, + "args": { + "External id": 229773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183442, "tid": 4183442, + "ts": 667115505691.886, "dur": 0.534, + "args": { + "External id": 229774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115505733.969, "dur": 24.654, + "args": { + "External id": 229775,"Sequence number": 2757956, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183442, "tid": 4183442, + "ts": 667115505760.535, "dur": 12.515, + "args": { + "External id": 229776,"Sequence number": 2757957, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8575 + } + }, + { + "ph": "s", "id": 2, "pid": 4183442, "tid": 4183442, "ts": 667115505760.535, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward", "pid": 4183442, "tid": 4183442, + "ts": 667115505880.388, "dur": 41.974, + "args": { + "External id": 229777,"Record function id": 0, "Ev Idx": 8576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183442, "tid": 4183442, + "ts": 667115506024.577, "dur": 35.606, + "args": { + "External id": 229778,"Sequence number": 2757958, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8577 + } + }, + { + "ph": "s", "id": 1, "pid": 4183442, "tid": 4183442, "ts": 667115506024.577, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ones_like", "pid": 4183442, "tid": 4183442, + "ts": 667115506119.407, "dur": 27.151, + "args": { + "External id": 229779,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 8578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115506120.860, "dur": 8.563, + "args": { + "External id": 229780,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 8579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115506124.720, "dur": 3.982, + "args": { + "External id": 229781,"Record function id": 0, "Concrete Inputs": ["[1]", "[1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115506131.177, "dur": 15.109, + "args": { + "External id": 229782,"Record function id": 0, "Concrete Inputs": ["", "1."], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183442, "tid": 4183442, + "ts": 667115955631.504, "dur": 77.003, + "args": { + "External id": 229783,"Sequence number": 2757959, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183442, "tid": 4183442, + "ts": 667115955718.937, "dur": 22.481, + "args": { + "External id": 229784,"Sequence number": 2757960, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115955861.848, "dur": 23.596, + "args": { + "External id": 229785,"Sequence number": 2757961, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115956355.401, "dur": 20.141, + "args": { + "External id": 229786,"Sequence number": 2757962, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115956381.456, "dur": 13.196, + "args": { + "External id": 229787,"Sequence number": 2757963, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 4183442, "tid": 4183442, + "ts": 667115958118.297, "dur": 2428.006, + "args": { + "External id": 229788,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 4183442, "tid": 4183442, + "ts": 667115958621.295, "dur": 697.866, + "args": { + "External id": 229789,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183442, "tid": 4183442, + "ts": 667115958639.045, "dur": 86.940, + "args": { + "External id": 229790,"Record function id": 0, "Concrete Inputs": ["[13797]", "6", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115958642.363, "dur": 11.738, + "args": { + "External id": 229791,"Record function id": 0, "Concrete Inputs": ["[13797]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183442, "tid": 4183442, + "ts": 667115958682.274, "dur": 43.269, + "args": { + "External id": 229792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[13797]], "Ev Idx": 8591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183442, "tid": 4183442, + "ts": 667115958685.471, "dur": 39.495, + "args": { + "External id": 229793,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[13797], []], "Ev Idx": 8592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960573.835, "dur": 2.874, + "args": { + "External id": 229794,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960578.889, "dur": 0.340, + "args": { + "External id": 229795,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960580.374, "dur": 0.375, + "args": { + "External id": 229796,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960582.314, "dur": 0.410, + "args": { + "External id": 229797,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960583.725, "dur": 0.427, + "args": { + "External id": 229798,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960585.696, "dur": 0.357, + "args": { + "External id": 229799,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960587.089, "dur": 0.410, + "args": { + "External id": 229800,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960589.709, "dur": 0.271, + "args": { + "External id": 229801,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960590.918, "dur": 0.396, + "args": { + "External id": 229802,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960592.469, "dur": 0.229, + "args": { + "External id": 229803,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960593.602, "dur": 0.238, + "args": { + "External id": 229804,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960594.881, "dur": 0.370, + "args": { + "External id": 229805,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960596.071, "dur": 0.416, + "args": { + "External id": 229806,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960597.535, "dur": 0.344, + "args": { + "External id": 229807,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960598.763, "dur": 0.395, + "args": { + "External id": 229808,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960601.166, "dur": 0.441, + "args": { + "External id": 229809,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960602.613, "dur": 0.260, + "args": { + "External id": 229810,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960603.832, "dur": 0.221, + "args": { + "External id": 229811,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960604.991, "dur": 0.255, + "args": { + "External id": 229812,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960606.125, "dur": 0.214, + "args": { + "External id": 229813,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960607.146, "dur": 0.246, + "args": { + "External id": 229814,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960608.211, "dur": 0.579, + "args": { + "External id": 229815,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960609.660, "dur": 0.339, + "args": { + "External id": 229816,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960612.339, "dur": 0.356, + "args": { + "External id": 229817,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960613.704, "dur": 0.285, + "args": { + "External id": 229818,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960615.152, "dur": 0.237, + "args": { + "External id": 229819,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960616.462, "dur": 0.255, + "args": { + "External id": 229820,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960617.736, "dur": 0.214, + "args": { + "External id": 229821,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960618.832, "dur": 0.348, + "args": { + "External id": 229822,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960620.009, "dur": 0.322, + "args": { + "External id": 229823,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960621.200, "dur": 0.305, + "args": { + "External id": 229824,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960623.600, "dur": 0.216, + "args": { + "External id": 229825,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960624.690, "dur": 0.231, + "args": { + "External id": 229826,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960626.149, "dur": 0.214, + "args": { + "External id": 229827,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960627.318, "dur": 0.250, + "args": { + "External id": 229828,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960628.411, "dur": 0.218, + "args": { + "External id": 229829,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960629.533, "dur": 0.228, + "args": { + "External id": 229830,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960630.625, "dur": 0.226, + "args": { + "External id": 229831,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960631.789, "dur": 0.220, + "args": { + "External id": 229832,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960634.320, "dur": 0.221, + "args": { + "External id": 229833,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960635.387, "dur": 0.216, + "args": { + "External id": 229834,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960636.679, "dur": 0.226, + "args": { + "External id": 229835,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960637.810, "dur": 0.221, + "args": { + "External id": 229836,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960639.030, "dur": 0.248, + "args": { + "External id": 229837,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960640.102, "dur": 0.238, + "args": { + "External id": 229838,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960641.157, "dur": 0.215, + "args": { + "External id": 229839,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960642.222, "dur": 0.215, + "args": { + "External id": 229840,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960645.539, "dur": 0.260, + "args": { + "External id": 229841,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960646.648, "dur": 0.217, + "args": { + "External id": 229842,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960647.724, "dur": 0.215, + "args": { + "External id": 229843,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960648.754, "dur": 0.218, + "args": { + "External id": 229844,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960649.788, "dur": 0.319, + "args": { + "External id": 229845,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960650.925, "dur": 0.293, + "args": { + "External id": 229846,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960652.301, "dur": 0.307, + "args": { + "External id": 229847,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960678.014, "dur": 1.096, + "args": { + "External id": 229848,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960683.677, "dur": 0.339, + "args": { + "External id": 229849,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960684.982, "dur": 0.338, + "args": { + "External id": 229850,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960686.258, "dur": 0.215, + "args": { + "External id": 229851,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960687.274, "dur": 0.339, + "args": { + "External id": 229852,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960688.560, "dur": 0.276, + "args": { + "External id": 229853,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960689.802, "dur": 0.340, + "args": { + "External id": 229854,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960691.040, "dur": 0.378, + "args": { + "External id": 229855,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960692.537, "dur": 0.220, + "args": { + "External id": 229856,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960695.373, "dur": 0.303, + "args": { + "External id": 229857,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960696.466, "dur": 0.369, + "args": { + "External id": 229858,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960697.993, "dur": 0.215, + "args": { + "External id": 229859,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960699.237, "dur": 0.242, + "args": { + "External id": 229860,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960700.504, "dur": 0.309, + "args": { + "External id": 229861,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960701.744, "dur": 0.216, + "args": { + "External id": 229862,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960702.921, "dur": 0.217, + "args": { + "External id": 229863,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960703.921, "dur": 0.240, + "args": { + "External id": 229864,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960706.910, "dur": 0.349, + "args": { + "External id": 229865,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960708.232, "dur": 0.332, + "args": { + "External id": 229866,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960709.402, "dur": 0.230, + "args": { + "External id": 229867,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960710.448, "dur": 0.349, + "args": { + "External id": 229868,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960711.574, "dur": 0.218, + "args": { + "External id": 229869,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960712.585, "dur": 0.215, + "args": { + "External id": 229870,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960714.292, "dur": 0.240, + "args": { + "External id": 229871,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960715.370, "dur": 0.209, + "args": { + "External id": 229872,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960717.631, "dur": 0.206, + "args": { + "External id": 229873,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960718.801, "dur": 0.209, + "args": { + "External id": 229874,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960719.805, "dur": 0.207, + "args": { + "External id": 229875,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960720.863, "dur": 0.205, + "args": { + "External id": 229876,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960721.864, "dur": 0.227, + "args": { + "External id": 229877,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960722.857, "dur": 0.206, + "args": { + "External id": 229878,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960724.050, "dur": 0.204, + "args": { + "External id": 229879,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960725.063, "dur": 0.242, + "args": { + "External id": 229880,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960727.224, "dur": 0.207, + "args": { + "External id": 229881,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960728.319, "dur": 0.220, + "args": { + "External id": 229882,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960729.320, "dur": 0.208, + "args": { + "External id": 229883,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960730.292, "dur": 0.205, + "args": { + "External id": 229884,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960731.320, "dur": 0.230, + "args": { + "External id": 229885,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960732.338, "dur": 0.232, + "args": { + "External id": 229886,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960734.388, "dur": 0.236, + "args": { + "External id": 229887,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960735.404, "dur": 0.341, + "args": { + "External id": 229888,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960761.800, "dur": 0.241, + "args": { + "External id": 234497,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960763.190, "dur": 0.204, + "args": { + "External id": 234498,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960764.219, "dur": 0.226, + "args": { + "External id": 234499,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960765.227, "dur": 0.218, + "args": { + "External id": 234500,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960766.236, "dur": 0.207, + "args": { + "External id": 234501,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960767.300, "dur": 0.205, + "args": { + "External id": 234502,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960768.278, "dur": 0.210, + "args": { + "External id": 234503,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960769.276, "dur": 0.211, + "args": { + "External id": 234504,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960772.031, "dur": 0.208, + "args": { + "External id": 234505,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960773.109, "dur": 0.205, + "args": { + "External id": 234506,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960774.103, "dur": 0.208, + "args": { + "External id": 234507,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960775.101, "dur": 0.206, + "args": { + "External id": 234508,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960776.159, "dur": 0.210, + "args": { + "External id": 234509,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960777.212, "dur": 0.208, + "args": { + "External id": 234510,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960778.856, "dur": 0.220, + "args": { + "External id": 234511,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960779.879, "dur": 0.210, + "args": { + "External id": 234512,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960782.122, "dur": 0.206, + "args": { + "External id": 234513,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960783.240, "dur": 0.228, + "args": { + "External id": 234514,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960784.283, "dur": 0.231, + "args": { + "External id": 234515,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960785.293, "dur": 0.229, + "args": { + "External id": 234516,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960786.386, "dur": 0.208, + "args": { + "External id": 234517,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960787.472, "dur": 0.206, + "args": { + "External id": 234518,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960788.521, "dur": 0.209, + "args": { + "External id": 234519,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960793.183, "dur": 0.212, + "args": { + "External id": 234520,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960795.779, "dur": 0.215, + "args": { + "External id": 234521,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960797.022, "dur": 0.214, + "args": { + "External id": 234522,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960798.043, "dur": 0.215, + "args": { + "External id": 234523,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960799.052, "dur": 0.215, + "args": { + "External id": 234524,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960800.085, "dur": 0.217, + "args": { + "External id": 234525,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960801.134, "dur": 0.214, + "args": { + "External id": 234526,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960802.113, "dur": 0.216, + "args": { + "External id": 234527,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960803.248, "dur": 0.220, + "args": { + "External id": 234528,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960806.086, "dur": 0.215, + "args": { + "External id": 234529,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960807.120, "dur": 0.216, + "args": { + "External id": 234530,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960809.009, "dur": 0.240, + "args": { + "External id": 234531,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960810.121, "dur": 0.214, + "args": { + "External id": 234532,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960811.128, "dur": 0.210, + "args": { + "External id": 234533,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960812.151, "dur": 0.216, + "args": { + "External id": 234534,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960813.147, "dur": 0.215, + "args": { + "External id": 234535,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960814.139, "dur": 0.212, + "args": { + "External id": 234536,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960816.723, "dur": 0.211, + "args": { + "External id": 234537,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960817.759, "dur": 0.209, + "args": { + "External id": 234538,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960818.760, "dur": 0.211, + "args": { + "External id": 234539,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960819.763, "dur": 0.213, + "args": { + "External id": 234540,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960820.774, "dur": 0.213, + "args": { + "External id": 234541,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960821.776, "dur": 0.235, + "args": { + "External id": 234542,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960822.868, "dur": 0.210, + "args": { + "External id": 234543,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960824.014, "dur": 0.207, + "args": { + "External id": 234544,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960826.576, "dur": 0.213, + "args": { + "External id": 234545,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960827.562, "dur": 0.212, + "args": { + "External id": 234546,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960828.565, "dur": 0.209, + "args": { + "External id": 234547,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960829.587, "dur": 0.211, + "args": { + "External id": 234548,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960830.571, "dur": 0.209, + "args": { + "External id": 234549,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960831.552, "dur": 0.232, + "args": { + "External id": 234550,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960832.983, "dur": 0.224, + "args": { + "External id": 234551,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960834.000, "dur": 0.229, + "args": { + "External id": 234552,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960836.340, "dur": 0.214, + "args": { + "External id": 234553,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960837.337, "dur": 0.208, + "args": { + "External id": 234554,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960838.416, "dur": 0.213, + "args": { + "External id": 234555,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960839.420, "dur": 0.213, + "args": { + "External id": 234556,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960840.451, "dur": 0.211, + "args": { + "External id": 234557,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960841.478, "dur": 0.212, + "args": { + "External id": 234558,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960842.522, "dur": 0.214, + "args": { + "External id": 234559,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960843.558, "dur": 0.211, + "args": { + "External id": 234560,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960845.932, "dur": 0.214, + "args": { + "External id": 234561,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960846.977, "dur": 0.224, + "args": { + "External id": 234562,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960850.020, "dur": 0.213, + "args": { + "External id": 234563,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960851.133, "dur": 0.219, + "args": { + "External id": 234564,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960852.232, "dur": 0.211, + "args": { + "External id": 234565,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960853.279, "dur": 0.228, + "args": { + "External id": 234566,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960854.365, "dur": 0.212, + "args": { + "External id": 234567,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960855.408, "dur": 0.221, + "args": { + "External id": 234568,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960857.392, "dur": 0.208, + "args": { + "External id": 234569,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960858.426, "dur": 0.221, + "args": { + "External id": 234570,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960859.440, "dur": 0.211, + "args": { + "External id": 234571,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960860.502, "dur": 0.214, + "args": { + "External id": 234572,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960861.624, "dur": 0.209, + "args": { + "External id": 234573,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960862.636, "dur": 0.215, + "args": { + "External id": 234574,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960864.085, "dur": 0.254, + "args": { + "External id": 234575,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960865.123, "dur": 0.209, + "args": { + "External id": 234576,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960867.652, "dur": 0.244, + "args": { + "External id": 234577,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960868.732, "dur": 0.220, + "args": { + "External id": 234578,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960869.737, "dur": 0.210, + "args": { + "External id": 234579,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960870.865, "dur": 0.234, + "args": { + "External id": 234580,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960871.940, "dur": 0.213, + "args": { + "External id": 234581,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960872.938, "dur": 0.211, + "args": { + "External id": 234582,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960873.946, "dur": 0.212, + "args": { + "External id": 234583,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960875.005, "dur": 0.211, + "args": { + "External id": 234584,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960876.948, "dur": 0.212, + "args": { + "External id": 234585,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960877.948, "dur": 0.208, + "args": { + "External id": 234586,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960878.978, "dur": 0.209, + "args": { + "External id": 234587,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960879.964, "dur": 0.207, + "args": { + "External id": 234588,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960880.953, "dur": 0.211, + "args": { + "External id": 234589,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960881.939, "dur": 0.225, + "args": { + "External id": 234590,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960882.945, "dur": 0.207, + "args": { + "External id": 234591,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960883.927, "dur": 0.209, + "args": { + "External id": 234592,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960886.565, "dur": 0.206, + "args": { + "External id": 234593,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960887.544, "dur": 0.208, + "args": { + "External id": 234594,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960888.531, "dur": 0.208, + "args": { + "External id": 234595,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960889.528, "dur": 0.207, + "args": { + "External id": 234596,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960890.523, "dur": 0.230, + "args": { + "External id": 234597,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960891.556, "dur": 0.209, + "args": { + "External id": 234598,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960892.582, "dur": 0.206, + "args": { + "External id": 234599,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960893.596, "dur": 0.208, + "args": { + "External id": 234600,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960896.176, "dur": 0.209, + "args": { + "External id": 234601,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960897.175, "dur": 0.209, + "args": { + "External id": 234602,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960898.576, "dur": 0.222, + "args": { + "External id": 234603,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960899.654, "dur": 0.209, + "args": { + "External id": 234604,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960906.717, "dur": 0.228, + "args": { + "External id": 234605,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960907.894, "dur": 0.243, + "args": { + "External id": 234606,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960908.933, "dur": 0.234, + "args": { + "External id": 234607,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960910.027, "dur": 0.209, + "args": { + "External id": 234608,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960912.107, "dur": 0.209, + "args": { + "External id": 234609,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960913.114, "dur": 0.207, + "args": { + "External id": 234610,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960914.096, "dur": 0.230, + "args": { + "External id": 234611,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960915.144, "dur": 0.214, + "args": { + "External id": 234612,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960916.136, "dur": 0.206, + "args": { + "External id": 234613,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960917.152, "dur": 0.205, + "args": { + "External id": 234614,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960918.153, "dur": 0.205, + "args": { + "External id": 234615,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960919.123, "dur": 0.206, + "args": { + "External id": 234616,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960921.056, "dur": 0.206, + "args": { + "External id": 234617,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960922.033, "dur": 0.227, + "args": { + "External id": 234618,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960923.054, "dur": 0.207, + "args": { + "External id": 234619,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115960924.089, "dur": 0.211, + "args": { + "External id": 234620,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183442, "tid": 4183442, + "ts": 667115960968.495, "dur": 1144.954, + "args": { + "External id": 234621,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183442, "tid": 4183442, + "ts": 667115961315.120, "dur": 733.300, + "args": { + "External id": 234622,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961321.071, "dur": 6.542, + "args": { + "External id": 234623,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961324.603, "dur": 2.661, + "args": { + "External id": 234624,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961328.202, "dur": 4.262, + "args": { + "External id": 234625,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961329.473, "dur": 2.862, + "args": { + "External id": 234626,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961332.864, "dur": 2.007, + "args": { + "External id": 234627,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961334.204, "dur": 0.601, + "args": { + "External id": 234628,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961335.210, "dur": 1.253, + "args": { + "External id": 234629,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961335.617, "dur": 0.780, + "args": { + "External id": 234630,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961338.262, "dur": 4.388, + "args": { + "External id": 234631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961342.044, "dur": 0.538, + "args": { + "External id": 234632,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961342.966, "dur": 0.950, + "args": { + "External id": 234633,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961343.415, "dur": 0.432, + "args": { + "External id": 234634,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961344.179, "dur": 1.094, + "args": { + "External id": 234635,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961344.566, "dur": 0.640, + "args": { + "External id": 234636,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961345.513, "dur": 5.456, + "args": { + "External id": 234637,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961350.397, "dur": 0.507, + "args": { + "External id": 234638,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961351.196, "dur": 1.259, + "args": { + "External id": 234639,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961351.717, "dur": 0.671, + "args": { + "External id": 234640,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961352.840, "dur": 3.056, + "args": { + "External id": 234641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961353.213, "dur": 2.613, + "args": { + "External id": 234642,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961356.145, "dur": 2.553, + "args": { + "External id": 234643,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961357.869, "dur": 0.767, + "args": { + "External id": 234644,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961358.930, "dur": 1.374, + "args": { + "External id": 234645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961359.309, "dur": 0.926, + "args": { + "External id": 234646,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961362.660, "dur": 5.148, + "args": { + "External id": 234647,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961366.794, "dur": 0.944, + "args": { + "External id": 234648,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961368.072, "dur": 1.007, + "args": { + "External id": 234649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961368.439, "dur": 0.579, + "args": { + "External id": 234650,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961369.399, "dur": 1.296, + "args": { + "External id": 234651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961369.773, "dur": 0.856, + "args": { + "External id": 234652,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961370.922, "dur": 3.646, + "args": { + "External id": 234653,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961373.781, "dur": 0.722, + "args": { + "External id": 234654,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961374.995, "dur": 1.307, + "args": { + "External id": 234655,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961375.395, "dur": 0.847, + "args": { + "External id": 234656,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961376.529, "dur": 3.768, + "args": { + "External id": 234657,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961376.896, "dur": 3.330, + "args": { + "External id": 234658,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961380.540, "dur": 2.886, + "args": { + "External id": 234659,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961382.406, "dur": 0.954, + "args": { + "External id": 234660,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961383.674, "dur": 1.151, + "args": { + "External id": 234661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961384.037, "dur": 0.723, + "args": { + "External id": 234662,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961386.388, "dur": 4.732, + "args": { + "External id": 234663,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961390.475, "dur": 0.582, + "args": { + "External id": 234664,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961391.364, "dur": 1.280, + "args": { + "External id": 234665,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961391.726, "dur": 0.853, + "args": { + "External id": 234666,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961393.068, "dur": 1.026, + "args": { + "External id": 234667,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961393.427, "dur": 0.601, + "args": { + "External id": 234668,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961394.315, "dur": 3.082, + "args": { + "External id": 234669,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961396.757, "dur": 0.578, + "args": { + "External id": 234670,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961397.621, "dur": 1.165, + "args": { + "External id": 234671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961398.027, "dur": 0.678, + "args": { + "External id": 234672,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961399.024, "dur": 3.196, + "args": { + "External id": 234673,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961399.398, "dur": 2.740, + "args": { + "External id": 234674,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961402.480, "dur": 2.553, + "args": { + "External id": 234675,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961404.299, "dur": 0.670, + "args": { + "External id": 234676,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961405.413, "dur": 1.487, + "args": { + "External id": 234677,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961405.798, "dur": 0.838, + "args": { + "External id": 234678,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961407.947, "dur": 4.157, + "args": { + "External id": 234679,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961411.475, "dur": 0.565, + "args": { + "External id": 234680,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961412.357, "dur": 1.243, + "args": { + "External id": 234681,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961412.729, "dur": 0.798, + "args": { + "External id": 234682,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961413.855, "dur": 1.171, + "args": { + "External id": 234683,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961414.240, "dur": 0.720, + "args": { + "External id": 234684,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961415.250, "dur": 3.302, + "args": { + "External id": 234685,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961417.853, "dur": 0.636, + "args": { + "External id": 234686,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961418.781, "dur": 1.067, + "args": { + "External id": 234687,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961419.144, "dur": 0.643, + "args": { + "External id": 234688,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961420.073, "dur": 3.680, + "args": { + "External id": 234689,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961420.434, "dur": 2.951, + "args": { + "External id": 234690,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961423.979, "dur": 2.733, + "args": { + "External id": 234691,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961425.808, "dur": 0.832, + "args": { + "External id": 234692,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961427.384, "dur": 1.299, + "args": { + "External id": 234693,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961427.943, "dur": 0.672, + "args": { + "External id": 234694,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961429.209, "dur": 4.190, + "args": { + "External id": 234695,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961432.552, "dur": 0.785, + "args": { + "External id": 234696,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961433.675, "dur": 1.113, + "args": { + "External id": 234697,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961434.057, "dur": 0.668, + "args": { + "External id": 234698,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961435.245, "dur": 1.377, + "args": { + "External id": 234699,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961435.657, "dur": 0.896, + "args": { + "External id": 234700,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961437.107, "dur": 3.511, + "args": { + "External id": 234701,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961439.620, "dur": 0.933, + "args": { + "External id": 234702,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961440.945, "dur": 1.162, + "args": { + "External id": 234703,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961441.308, "dur": 0.733, + "args": { + "External id": 234704,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961442.605, "dur": 3.456, + "args": { + "External id": 234705,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961442.971, "dur": 3.017, + "args": { + "External id": 234706,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961446.319, "dur": 1.664, + "args": { + "External id": 234707,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961446.900, "dur": 1.019, + "args": { + "External id": 234708,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961448.228, "dur": 1.225, + "args": { + "External id": 234709,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961448.599, "dur": 0.788, + "args": { + "External id": 234710,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961449.882, "dur": 3.222, + "args": { + "External id": 234711,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961452.425, "dur": 0.611, + "args": { + "External id": 234712,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961453.384, "dur": 0.908, + "args": { + "External id": 234713,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961453.741, "dur": 0.490, + "args": { + "External id": 234714,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961454.539, "dur": 1.066, + "args": { + "External id": 234715,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961454.910, "dur": 0.629, + "args": { + "External id": 234716,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961455.903, "dur": 3.172, + "args": { + "External id": 234717,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961458.307, "dur": 0.707, + "args": { + "External id": 234718,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961459.319, "dur": 1.056, + "args": { + "External id": 234719,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961459.692, "dur": 0.619, + "args": { + "External id": 234720,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961460.739, "dur": 3.125, + "args": { + "External id": 234721,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961461.131, "dur": 2.653, + "args": { + "External id": 234722,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961464.305, "dur": 1.325, + "args": { + "External id": 234723,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961465.062, "dur": 0.506, + "args": { + "External id": 234724,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961465.880, "dur": 1.178, + "args": { + "External id": 234725,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961466.255, "dur": 0.735, + "args": { + "External id": 234726,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961467.317, "dur": 3.155, + "args": { + "External id": 234727,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961469.786, "dur": 0.622, + "args": { + "External id": 234728,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961470.735, "dur": 1.050, + "args": { + "External id": 234729,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961471.124, "dur": 0.597, + "args": { + "External id": 234730,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961472.232, "dur": 1.207, + "args": { + "External id": 234731,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961472.644, "dur": 0.728, + "args": { + "External id": 234732,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961473.689, "dur": 3.128, + "args": { + "External id": 234733,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961475.960, "dur": 0.792, + "args": { + "External id": 234734,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961477.098, "dur": 1.013, + "args": { + "External id": 234735,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961477.460, "dur": 0.590, + "args": { + "External id": 234736,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961478.357, "dur": 3.331, + "args": { + "External id": 234737,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961478.735, "dur": 2.882, + "args": { + "External id": 234738,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961481.934, "dur": 1.934, + "args": { + "External id": 234739,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961482.823, "dur": 0.985, + "args": { + "External id": 234740,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961484.116, "dur": 1.114, + "args": { + "External id": 234741,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961484.477, "dur": 0.686, + "args": { + "External id": 234742,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961485.873, "dur": 3.995, + "args": { + "External id": 234743,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961489.117, "dur": 0.687, + "args": { + "External id": 234744,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961490.142, "dur": 1.236, + "args": { + "External id": 234745,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961490.512, "dur": 0.806, + "args": { + "External id": 234746,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961491.639, "dur": 15.876, + "args": { + "External id": 234747,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961506.322, "dur": 0.877, + "args": { + "External id": 234748,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961507.900, "dur": 2.908, + "args": { + "External id": 234749,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961510.255, "dur": 0.492, + "args": { + "External id": 234750,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961511.082, "dur": 1.021, + "args": { + "External id": 234751,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961511.502, "dur": 0.538, + "args": { + "External id": 234752,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961512.370, "dur": 2.835, + "args": { + "External id": 234753,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961512.740, "dur": 2.395, + "args": { + "External id": 234754,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961515.505, "dur": 1.391, + "args": { + "External id": 234755,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961516.075, "dur": 0.757, + "args": { + "External id": 234756,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961517.155, "dur": 1.192, + "args": { + "External id": 234757,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961517.539, "dur": 0.741, + "args": { + "External id": 234758,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961518.621, "dur": 2.908, + "args": { + "External id": 234759,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961520.986, "dur": 0.477, + "args": { + "External id": 234760,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961521.809, "dur": 1.114, + "args": { + "External id": 234761,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961522.171, "dur": 0.689, + "args": { + "External id": 234762,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961523.209, "dur": 1.246, + "args": { + "External id": 234763,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961523.599, "dur": 0.789, + "args": { + "External id": 234764,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961524.734, "dur": 2.955, + "args": { + "External id": 234765,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961527.101, "dur": 0.524, + "args": { + "External id": 234766,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961527.949, "dur": 1.207, + "args": { + "External id": 234767,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961528.334, "dur": 0.762, + "args": { + "External id": 234768,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961529.414, "dur": 2.866, + "args": { + "External id": 234769,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961529.777, "dur": 2.431, + "args": { + "External id": 234770,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961532.543, "dur": 1.342, + "args": { + "External id": 234771,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961533.156, "dur": 0.665, + "args": { + "External id": 234772,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961534.188, "dur": 1.157, + "args": { + "External id": 234773,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961534.551, "dur": 0.732, + "args": { + "External id": 234774,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961535.720, "dur": 3.022, + "args": { + "External id": 234775,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961538.150, "dur": 0.529, + "args": { + "External id": 234776,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961539.055, "dur": 1.114, + "args": { + "External id": 234777,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961539.427, "dur": 0.682, + "args": { + "External id": 234778,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961540.427, "dur": 1.158, + "args": { + "External id": 234779,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961540.789, "dur": 0.729, + "args": { + "External id": 234780,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961541.860, "dur": 3.015, + "args": { + "External id": 234781,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961544.078, "dur": 0.737, + "args": { + "External id": 234782,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961545.156, "dur": 1.620, + "args": { + "External id": 234783,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961545.532, "dur": 1.178, + "args": { + "External id": 234784,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961547.031, "dur": 2.943, + "args": { + "External id": 234785,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961547.396, "dur": 2.511, + "args": { + "External id": 234786,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961550.236, "dur": 1.218, + "args": { + "External id": 234787,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961550.676, "dur": 0.717, + "args": { + "External id": 234788,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961551.883, "dur": 1.233, + "args": { + "External id": 234789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961552.243, "dur": 0.806, + "args": { + "External id": 234790,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961553.399, "dur": 3.301, + "args": { + "External id": 234791,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961556.090, "dur": 0.546, + "args": { + "External id": 234792,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961556.972, "dur": 1.213, + "args": { + "External id": 234793,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961557.343, "dur": 0.779, + "args": { + "External id": 234794,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961558.440, "dur": 1.146, + "args": { + "External id": 234795,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961558.803, "dur": 0.721, + "args": { + "External id": 234796,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961560.105, "dur": 3.267, + "args": { + "External id": 234797,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961562.415, "dur": 0.891, + "args": { + "External id": 234798,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961563.826, "dur": 1.043, + "args": { + "External id": 234799,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961564.196, "dur": 0.604, + "args": { + "External id": 234800,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961565.300, "dur": 2.560, + "args": { + "External id": 234801,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961565.669, "dur": 2.118, + "args": { + "External id": 234802,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961568.150, "dur": 1.354, + "args": { + "External id": 234803,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961568.817, "dur": 0.626, + "args": { + "External id": 234804,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961569.916, "dur": 1.148, + "args": { + "External id": 234805,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961570.294, "dur": 0.705, + "args": { + "External id": 234806,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961571.344, "dur": 3.834, + "args": { + "External id": 234807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961574.517, "dur": 0.597, + "args": { + "External id": 234808,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961575.540, "dur": 1.071, + "args": { + "External id": 234809,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961575.913, "dur": 0.639, + "args": { + "External id": 234810,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961577.009, "dur": 1.067, + "args": { + "External id": 234811,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961577.370, "dur": 0.637, + "args": { + "External id": 234812,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961578.367, "dur": 3.287, + "args": { + "External id": 234813,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961580.847, "dur": 0.747, + "args": { + "External id": 234814,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961581.912, "dur": 1.415, + "args": { + "External id": 234815,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961582.314, "dur": 0.951, + "args": { + "External id": 234816,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961583.580, "dur": 2.687, + "args": { + "External id": 234817,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961583.940, "dur": 2.254, + "args": { + "External id": 234818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961586.518, "dur": 1.347, + "args": { + "External id": 234819,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961587.179, "dur": 0.623, + "args": { + "External id": 234820,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961588.121, "dur": 1.258, + "args": { + "External id": 234821,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961588.536, "dur": 0.778, + "args": { + "External id": 234822,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961589.690, "dur": 3.088, + "args": { + "External id": 234823,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961592.082, "dur": 0.634, + "args": { + "External id": 234824,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961593.076, "dur": 1.175, + "args": { + "External id": 234825,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961593.464, "dur": 0.727, + "args": { + "External id": 234826,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961594.554, "dur": 1.211, + "args": { + "External id": 234827,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961594.927, "dur": 0.771, + "args": { + "External id": 234828,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961596.203, "dur": 2.954, + "args": { + "External id": 234829,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961598.450, "dur": 0.644, + "args": { + "External id": 234830,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961599.438, "dur": 1.120, + "args": { + "External id": 234831,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961599.824, "dur": 0.663, + "args": { + "External id": 234832,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961601.011, "dur": 2.876, + "args": { + "External id": 234833,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961601.380, "dur": 2.438, + "args": { + "External id": 234834,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961604.230, "dur": 1.298, + "args": { + "External id": 234835,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961604.980, "dur": 0.486, + "args": { + "External id": 234836,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961605.778, "dur": 0.981, + "args": { + "External id": 234837,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961606.142, "dur": 0.551, + "args": { + "External id": 234838,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961607.029, "dur": 3.838, + "args": { + "External id": 234839,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961610.407, "dur": 0.397, + "args": { + "External id": 234840,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961611.141, "dur": 0.734, + "args": { + "External id": 234841,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961611.500, "dur": 0.314, + "args": { + "External id": 234842,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961612.178, "dur": 1.003, + "args": { + "External id": 234843,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961612.565, "dur": 0.548, + "args": { + "External id": 234844,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961613.529, "dur": 3.003, + "args": { + "External id": 234845,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961616.043, "dur": 0.426, + "args": { + "External id": 234846,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961616.834, "dur": 1.226, + "args": { + "External id": 234847,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961617.223, "dur": 0.773, + "args": { + "External id": 234848,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961618.383, "dur": 2.672, + "args": { + "External id": 234849,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961618.757, "dur": 2.226, + "args": { + "External id": 234850,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961621.314, "dur": 1.380, + "args": { + "External id": 234851,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961622.060, "dur": 0.574, + "args": { + "External id": 234852,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961622.948, "dur": 0.788, + "args": { + "External id": 234853,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961623.318, "dur": 0.352, + "args": { + "External id": 234854,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961623.994, "dur": 3.344, + "args": { + "External id": 234855,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961626.830, "dur": 0.448, + "args": { + "External id": 234856,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961627.629, "dur": 0.676, + "args": { + "External id": 234857,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961627.997, "dur": 0.247, + "args": { + "External id": 234858,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961628.570, "dur": 1.539, + "args": { + "External id": 234859,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961628.958, "dur": 1.082, + "args": { + "External id": 234860,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961630.596, "dur": 3.499, + "args": { + "External id": 234861,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961633.016, "dur": 1.007, + "args": { + "External id": 234862,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961634.389, "dur": 1.072, + "args": { + "External id": 234863,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961634.747, "dur": 0.652, + "args": { + "External id": 234864,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961635.893, "dur": 2.845, + "args": { + "External id": 234865,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961636.263, "dur": 2.401, + "args": { + "External id": 234866,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961639.000, "dur": 1.720, + "args": { + "External id": 234867,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961639.668, "dur": 0.986, + "args": { + "External id": 234868,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961641.058, "dur": 1.310, + "args": { + "External id": 234869,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961641.478, "dur": 0.822, + "args": { + "External id": 234870,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961642.627, "dur": 3.240, + "args": { + "External id": 234871,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961645.060, "dur": 0.737, + "args": { + "External id": 234872,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961646.129, "dur": 1.153, + "args": { + "External id": 234873,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961646.499, "dur": 0.720, + "args": { + "External id": 234874,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961647.540, "dur": 1.292, + "args": { + "External id": 234875,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961647.914, "dur": 0.855, + "args": { + "External id": 234876,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961649.115, "dur": 2.957, + "args": { + "External id": 234877,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961651.318, "dur": 0.686, + "args": { + "External id": 234878,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961652.329, "dur": 26.632, + "args": { + "External id": 234879,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961652.686, "dur": 25.517, + "args": { + "External id": 234880,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961680.341, "dur": 3.938, + "args": { + "External id": 234881,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961681.396, "dur": 2.792, + "args": { + "External id": 234882,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961684.570, "dur": 1.432, + "args": { + "External id": 234883,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961685.480, "dur": 0.461, + "args": { + "External id": 234884,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961686.282, "dur": 2.387, + "args": { + "External id": 234885,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961687.557, "dur": 1.041, + "args": { + "External id": 234886,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961688.969, "dur": 3.001, + "args": { + "External id": 234887,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961691.382, "dur": 0.525, + "args": { + "External id": 234888,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961692.305, "dur": 1.108, + "args": { + "External id": 234889,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961692.771, "dur": 0.578, + "args": { + "External id": 234890,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961693.691, "dur": 1.136, + "args": { + "External id": 234891,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961694.127, "dur": 0.630, + "args": { + "External id": 234892,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961695.106, "dur": 5.073, + "args": { + "External id": 234893,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961699.480, "dur": 0.638, + "args": { + "External id": 234894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961700.471, "dur": 1.114, + "args": { + "External id": 234895,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961700.986, "dur": 0.535, + "args": { + "External id": 234896,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961701.888, "dur": 2.988, + "args": { + "External id": 234897,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961702.360, "dur": 2.440, + "args": { + "External id": 234898,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961705.136, "dur": 1.287, + "args": { + "External id": 234899,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961705.804, "dur": 0.557, + "args": { + "External id": 234900,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961706.739, "dur": 1.169, + "args": { + "External id": 234901,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961707.193, "dur": 0.642, + "args": { + "External id": 234902,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961708.191, "dur": 2.882, + "args": { + "External id": 234903,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961710.346, "dur": 0.667, + "args": { + "External id": 234904,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961711.380, "dur": 1.140, + "args": { + "External id": 234905,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961711.939, "dur": 0.520, + "args": { + "External id": 234906,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961712.879, "dur": 1.549, + "args": { + "External id": 234907,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961713.373, "dur": 0.986, + "args": { + "External id": 234908,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961714.934, "dur": 3.452, + "args": { + "External id": 234909,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961717.608, "dur": 0.714, + "args": { + "External id": 234910,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961718.660, "dur": 1.260, + "args": { + "External id": 234911,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961719.184, "dur": 0.676, + "args": { + "External id": 234912,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961720.206, "dur": 2.815, + "args": { + "External id": 234913,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961720.665, "dur": 2.278, + "args": { + "External id": 234914,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961723.278, "dur": 1.240, + "args": { + "External id": 234915,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961723.737, "dur": 0.717, + "args": { + "External id": 234916,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961724.779, "dur": 1.340, + "args": { + "External id": 234917,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961725.383, "dur": 0.667, + "args": { + "External id": 234918,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961726.396, "dur": 2.955, + "args": { + "External id": 234919,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961728.904, "dur": 0.385, + "args": { + "External id": 234920,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961729.666, "dur": 0.975, + "args": { + "External id": 234921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961730.096, "dur": 0.481, + "args": { + "External id": 234922,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961730.924, "dur": 1.488, + "args": { + "External id": 234923,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961731.350, "dur": 0.989, + "args": { + "External id": 234924,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961732.685, "dur": 3.250, + "args": { + "External id": 234925,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961735.343, "dur": 0.530, + "args": { + "External id": 234926,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961736.351, "dur": 1.220, + "args": { + "External id": 234927,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961736.842, "dur": 0.669, + "args": { + "External id": 234928,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961737.869, "dur": 2.607, + "args": { + "External id": 234929,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961738.321, "dur": 2.077, + "args": { + "External id": 234930,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961740.735, "dur": 1.173, + "args": { + "External id": 234931,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961741.158, "dur": 0.688, + "args": { + "External id": 234932,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961742.364, "dur": 1.224, + "args": { + "External id": 234933,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961742.822, "dur": 0.693, + "args": { + "External id": 234934,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961743.868, "dur": 3.176, + "args": { + "External id": 234935,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961746.209, "dur": 0.770, + "args": { + "External id": 234936,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961747.364, "dur": 1.079, + "args": { + "External id": 234937,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961747.784, "dur": 0.595, + "args": { + "External id": 234938,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961748.813, "dur": 1.053, + "args": { + "External id": 234939,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961749.237, "dur": 0.560, + "args": { + "External id": 234940,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961750.146, "dur": 2.892, + "args": { + "External id": 234941,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961752.293, "dur": 0.684, + "args": { + "External id": 234942,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961753.309, "dur": 0.950, + "args": { + "External id": 234943,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961753.741, "dur": 0.458, + "args": { + "External id": 234944,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961754.564, "dur": 2.800, + "args": { + "External id": 234945,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961755.011, "dur": 2.278, + "args": { + "External id": 234946,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961757.637, "dur": 0.965, + "args": { + "External id": 234947,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961758.050, "dur": 0.491, + "args": { + "External id": 234948,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961758.857, "dur": 1.204, + "args": { + "External id": 234949,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961759.310, "dur": 0.687, + "args": { + "External id": 234950,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961760.337, "dur": 2.994, + "args": { + "External id": 234951,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961762.651, "dur": 0.617, + "args": { + "External id": 234952,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961763.635, "dur": 1.038, + "args": { + "External id": 234953,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961764.070, "dur": 0.540, + "args": { + "External id": 234954,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961765.133, "dur": 1.104, + "args": { + "External id": 234955,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961765.560, "dur": 0.607, + "args": { + "External id": 234956,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961766.491, "dur": 2.861, + "args": { + "External id": 234957,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961768.523, "dur": 0.766, + "args": { + "External id": 234958,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961769.628, "dur": 1.069, + "args": { + "External id": 234959,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961770.070, "dur": 0.566, + "args": { + "External id": 234960,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961770.970, "dur": 2.886, + "args": { + "External id": 234961,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961771.390, "dur": 2.392, + "args": { + "External id": 234962,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961774.115, "dur": 1.280, + "args": { + "External id": 234963,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961774.559, "dur": 0.772, + "args": { + "External id": 234964,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961775.859, "dur": 1.104, + "args": { + "External id": 234965,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961776.346, "dur": 0.546, + "args": { + "External id": 234966,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961777.437, "dur": 3.209, + "args": { + "External id": 234967,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961779.795, "dur": 0.790, + "args": { + "External id": 234968,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961780.949, "dur": 1.045, + "args": { + "External id": 234969,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961781.397, "dur": 0.532, + "args": { + "External id": 234970,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961782.270, "dur": 1.332, + "args": { + "External id": 234971,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961782.777, "dur": 0.754, + "args": { + "External id": 234972,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961783.869, "dur": 2.539, + "args": { + "External id": 234973,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961785.746, "dur": 0.596, + "args": { + "External id": 234974,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961786.712, "dur": 1.419, + "args": { + "External id": 234975,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961787.259, "dur": 0.811, + "args": { + "External id": 234976,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961788.417, "dur": 2.651, + "args": { + "External id": 234977,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961788.922, "dur": 2.072, + "args": { + "External id": 234978,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961791.333, "dur": 1.033, + "args": { + "External id": 234979,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961791.774, "dur": 0.530, + "args": { + "External id": 234980,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961792.623, "dur": 1.088, + "args": { + "External id": 234981,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961793.036, "dur": 0.606, + "args": { + "External id": 234982,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961793.980, "dur": 2.719, + "args": { + "External id": 234983,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961796.100, "dur": 0.534, + "args": { + "External id": 234984,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961796.979, "dur": 1.364, + "args": { + "External id": 234985,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961797.457, "dur": 0.825, + "args": { + "External id": 234986,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961798.613, "dur": 1.029, + "args": { + "External id": 234987,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961799.020, "dur": 0.551, + "args": { + "External id": 234988,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961799.986, "dur": 3.349, + "args": { + "External id": 234989,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961802.548, "dur": 0.725, + "args": { + "External id": 234990,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961803.602, "dur": 1.146, + "args": { + "External id": 234991,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961804.011, "dur": 0.675, + "args": { + "External id": 234992,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961805.011, "dur": 3.004, + "args": { + "External id": 234993,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961805.486, "dur": 2.456, + "args": { + "External id": 234994,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961808.269, "dur": 1.341, + "args": { + "External id": 234995,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961808.723, "dur": 0.826, + "args": { + "External id": 234996,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961809.957, "dur": 1.211, + "args": { + "External id": 234997,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961810.390, "dur": 0.718, + "args": { + "External id": 234998,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961811.438, "dur": 2.932, + "args": { + "External id": 234999,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961813.751, "dur": 0.559, + "args": { + "External id": 235000,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961814.651, "dur": 1.052, + "args": { + "External id": 235001,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961815.128, "dur": 0.511, + "args": { + "External id": 235002,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961816.013, "dur": 1.234, + "args": { + "External id": 235003,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961816.448, "dur": 0.731, + "args": { + "External id": 235004,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961817.562, "dur": 3.246, + "args": { + "External id": 235005,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961819.971, "dur": 0.773, + "args": { + "External id": 235006,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961821.084, "dur": 1.149, + "args": { + "External id": 235007,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961821.535, "dur": 0.638, + "args": { + "External id": 235008,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961847.055, "dur": 8.160, + "args": { + "External id": 235009,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961852.949, "dur": 2.190, + "args": { + "External id": 235010,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961855.514, "dur": 1.120, + "args": { + "External id": 235011,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961856.168, "dur": 0.403, + "args": { + "External id": 235012,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961856.946, "dur": 1.185, + "args": { + "External id": 235013,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961857.427, "dur": 0.633, + "args": { + "External id": 235014,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961858.399, "dur": 3.215, + "args": { + "External id": 235015,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961860.910, "dur": 0.642, + "args": { + "External id": 235016,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961861.946, "dur": 1.480, + "args": { + "External id": 235017,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961862.764, "dur": 0.599, + "args": { + "External id": 235018,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961863.696, "dur": 1.258, + "args": { + "External id": 235019,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961864.121, "dur": 0.770, + "args": { + "External id": 235020,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961865.209, "dur": 2.922, + "args": { + "External id": 235021,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961867.527, "dur": 0.543, + "args": { + "External id": 235022,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961868.407, "dur": 1.434, + "args": { + "External id": 235023,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961869.072, "dur": 0.705, + "args": { + "External id": 235024,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961870.105, "dur": 2.713, + "args": { + "External id": 235025,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961870.559, "dur": 2.185, + "args": { + "External id": 235026,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961873.105, "dur": 1.077, + "args": { + "External id": 235027,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961873.564, "dur": 0.555, + "args": { + "External id": 235028,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961874.472, "dur": 1.093, + "args": { + "External id": 235029,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961874.932, "dur": 0.563, + "args": { + "External id": 235030,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961875.834, "dur": 2.922, + "args": { + "External id": 235031,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961878.078, "dur": 0.612, + "args": { + "External id": 235032,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961879.032, "dur": 1.479, + "args": { + "External id": 235033,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961879.659, "dur": 0.788, + "args": { + "External id": 235034,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961880.783, "dur": 6.549, + "args": { + "External id": 235035,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961885.245, "dur": 2.022, + "args": { + "External id": 235036,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961887.631, "dur": 1.447, + "args": { + "External id": 235037,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961888.087, "dur": 0.928, + "args": { + "External id": 235038,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961889.352, "dur": 1.497, + "args": { + "External id": 235039,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961889.798, "dur": 0.980, + "args": { + "External id": 235040,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961891.138, "dur": 4.556, + "args": { + "External id": 235041,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961894.696, "dur": 0.933, + "args": { + "External id": 235042,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961895.994, "dur": 1.425, + "args": { + "External id": 235043,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961896.783, "dur": 0.574, + "args": { + "External id": 235044,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961897.683, "dur": 1.742, + "args": { + "External id": 235045,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961898.581, "dur": 0.776, + "args": { + "External id": 235046,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961899.860, "dur": 3.151, + "args": { + "External id": 235047,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961902.378, "dur": 0.569, + "args": { + "External id": 235048,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961903.444, "dur": 1.634, + "args": { + "External id": 235049,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961904.623, "dur": 0.393, + "args": { + "External id": 235050,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961905.357, "dur": 2.515, + "args": { + "External id": 235051,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961905.965, "dur": 1.834, + "args": { + "External id": 235052,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961908.315, "dur": 1.423, + "args": { + "External id": 235053,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961909.179, "dur": 0.496, + "args": { + "External id": 235054,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961909.994, "dur": 1.758, + "args": { + "External id": 235055,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961910.585, "dur": 1.106, + "args": { + "External id": 235056,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961912.224, "dur": 3.318, + "args": { + "External id": 235057,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961914.898, "dur": 0.576, + "args": { + "External id": 235058,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183442, "tid": 4183442, + "ts": 667115961915.836, "dur": 1.530, + "args": { + "External id": 235059,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115961916.650, "dur": 0.650, + "args": { + "External id": 235060,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 4183442, "tid": 4183442, + "ts": 667115961936.665, "dur": 102.786, + "args": { + "External id": 235061,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 4183442, "tid": 4183442, + "ts": 667115962126.200, "dur": 125.641, + "args": { + "External id": 235062,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[219], [], [], [], []], "Ev Idx": 9253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 4183442, "tid": 4183442, + "ts": 667115962187.357, "dur": 45.018, + "args": { + "External id": 235063,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[219], [], [], [], []], "Ev Idx": 9254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183442, "tid": 4183442, + "ts": 667115962200.008, "dur": 1.082, + "args": { + "External id": 235064,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Redistribute", "pid": 4183442, "tid": 4183442, + "ts": 667115962587.394, "dur": 884.144, + "args": { + "External id": 235065,"Sequence number": 2757964, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "False"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183442, "tid": 4183442, + "ts": 667115962641.425, "dur": 77.517, + "args": { + "External id": 235066,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115962645.855, "dur": 1.348, + "args": { + "External id": 235067,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115962649.329, "dur": 0.555, + "args": { + "External id": 235068,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::all_reduce", "pid": 4183442, "tid": 4183442, + "ts": 667115962746.707, "dur": 433.512, + "args": { + "External id": 235069,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["float", "", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183442, "tid": 4183442, + "ts": 667115962750.378, "dur": 45.251, + "args": { + "External id": 235070,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183442, "tid": 4183442, + "ts": 667115962753.858, "dur": 8.754, + "args": { + "External id": 235071,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "0"], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115962757.929, "dur": 3.918, + "args": { + "External id": 235072,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183442, "tid": 4183442, + "ts": 667115962764.451, "dur": 30.680, + "args": { + "External id": 235073,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::allreduce_", "pid": 4183442, "tid": 4183442, + "ts": 667115962805.795, "dur": 371.438, + "args": { + "External id": 235074,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "-1"], "Input type": ["TensorList", "", "", "", "Scalar"], "Input Strides": [[[]], [], [], [], []], "Input Dims": [[[]], [], [], [], []], "Ev Idx": 9265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115962835.118, "dur": 336.111, + "args": { + "External id": 235075,"Record function id": 0, "Collective name": "allreduce", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[[]], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1, "Process Group Name": "0", "Input type": ["TensorList", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[[]], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 9266, "In msg nelems": 1 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:all_reduce", "pid": 4183442, "tid": 4183442, + "ts": 667115962852.266, "dur": 313.352, + "args": { + "External id": 235076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183442, "tid": 4183442, + "ts": 667115963241.266, "dur": 192.215, + "args": { + "External id": 235077,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::wait_tensor", "pid": 4183442, "tid": 4183442, + "ts": 667115963335.044, "dur": 26.524, + "args": { + "External id": 235078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183442, "tid": 4183442, + "ts": 667115963348.970, "dur": 4.548, + "args": { + "External id": 235079,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 9270, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183442, "tid": 4183442, + "ts": 667115963390.652, "dur": 37.124, + "args": { + "External id": 235080,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115963392.896, "dur": 1.136, + "args": { + "External id": 235081,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115963395.528, "dur": 0.715, + "args": { + "External id": 235082,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_ToTorchTensor", "pid": 4183442, "tid": 4183442, + "ts": 667115963487.456, "dur": 45.855, + "args": { + "External id": 235083,"Sequence number": 2757965, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183442, "tid": 4183442, + "ts": 667115963519.557, "dur": 9.179, + "args": { + "External id": 235084,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183442, "tid": 4183442, + "ts": 667115963522.369, "dur": 6.006, + "args": { + "External id": 235085,"Record function id": 0, "Concrete Inputs": ["", "[]"], "Input type": ["float", "ScalarList"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183442, "tid": 4183442, + "ts": 667115963995.796, "dur": 40.651, + "args": { + "External id": 235086,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "double", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reciprocal", "pid": 4183442, "tid": 4183442, + "ts": 667115964047.601, "dur": 27.511, + "args": { + "External id": 235087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mul", "pid": 4183442, "tid": 4183442, + "ts": 667115964084.743, "dur": 24.803, + "args": { + "External id": 235088,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "double"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clamp", "pid": 4183442, "tid": 4183442, + "ts": 667115964123.681, "dur": 24.248, + "args": { + "External id": 235089,"Record function id": 0, "Concrete Inputs": ["", "", "1."], "Input type": ["float", "", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115964127.688, "dur": 0.879, + "args": { + "External id": 235090,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183442, "tid": 4183442, + "ts": 667115964165.184, "dur": 0.394, + "args": { + "External id": 235091,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 9282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 4183442, "tid": 4183442, + "ts": 667115964261.913, "dur": 562.263, + "args": { + "External id": 235092,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 4183442, "tid": 4183442, + "ts": 667115964724.588, "dur": 70.113, + "args": { + "External id": 235093,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::isnan", "pid": 4183442, "tid": 4183442, + "ts": 667115964863.703, "dur": 28.677, + "args": { + "External id": 235094,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183442, "tid": 4183442, + "ts": 667115964868.172, "dur": 23.660, + "args": { + "External id": 235095,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 4183442, + "ts": 667115964896.909, "dur": 61.529, + "args": { + "External id": 235096,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115964898.764, "dur": 59.493, + "args": { + "External id": 235097,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115964900.565, "dur": 57.369, + "args": { + "External id": 235098,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::isinf", "pid": 4183442, "tid": 4183442, + "ts": 667115964963.449, "dur": 52.448, + "args": { + "External id": 235099,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115964966.501, "dur": 29.869, + "args": { + "External id": 235100,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183442, "tid": 4183442, + "ts": 667115964972.315, "dur": 2.773, + "args": { + "External id": 235101,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183442, "tid": 4183442, + "ts": 667115964976.636, "dur": 19.371, + "args": { + "External id": 235102,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], [1]], "Input Dims": [[], [0]], "Ev Idx": 9293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183442, "tid": 4183442, + "ts": 667115964981.251, "dur": 2.400, + "args": { + "External id": 235103,"Record function id": 0, "Concrete Inputs": ["", "[]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183442, "tid": 4183442, + "ts": 667115964998.629, "dur": 16.504, + "args": { + "External id": 235104,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183442, "tid": 4183442, + "ts": 667115965018.062, "dur": 36.838, + "args": { + "External id": 235105,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183442, "tid": 4183442, + "ts": 667115965019.052, "dur": 35.707, + "args": { + "External id": 235106,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183442, "tid": 4183442, + "ts": 667115965019.823, "dur": 34.637, + "args": { + "External id": 235107,"Sequence number": 2757966, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9298 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#OptimizersContainer.step", "pid": 4183442, "tid": 4183442, + "ts": 667115965085.168, "dur": 4467.509, + "args": { + "External id": 235108,"Record function id": 0, "Ev Idx": 9299 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#AdamW.step", "pid": 4183442, "tid": 4183442, + "ts": 667115965118.453, "dur": 4411.988, + "args": { + "External id": 235109,"Record function id": 0, "Ev Idx": 9300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_add_", "pid": 4183442, "tid": 4183442, + "ts": 667115966144.991, "dur": 197.987, + "args": { + "External id": 235110,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966160.942, "dur": 1.111, + "args": { + "External id": 235111,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966163.115, "dur": 0.538, + "args": { + "External id": 235112,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966164.162, "dur": 0.278, + "args": { + "External id": 235113,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966164.981, "dur": 0.292, + "args": { + "External id": 235114,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966165.628, "dur": 0.065, + "args": { + "External id": 235115,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966166.047, "dur": 0.220, + "args": { + "External id": 235116,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966166.630, "dur": 0.192, + "args": { + "External id": 235117,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966167.248, "dur": 0.057, + "args": { + "External id": 235118,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966167.783, "dur": 0.228, + "args": { + "External id": 235119,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966168.433, "dur": 0.194, + "args": { + "External id": 235120,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966168.944, "dur": 0.094, + "args": { + "External id": 235121,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966169.460, "dur": 0.100, + "args": { + "External id": 235122,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966170.006, "dur": 0.054, + "args": { + "External id": 235123,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966170.381, "dur": 0.132, + "args": { + "External id": 235124,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966170.940, "dur": 0.180, + "args": { + "External id": 235125,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966171.413, "dur": 0.217, + "args": { + "External id": 235126,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966171.995, "dur": 0.102, + "args": { + "External id": 235127,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966172.566, "dur": 0.107, + "args": { + "External id": 235128,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966173.065, "dur": 0.078, + "args": { + "External id": 235129,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966173.569, "dur": 0.070, + "args": { + "External id": 235130,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966174.044, "dur": 0.066, + "args": { + "External id": 235131,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966174.501, "dur": 0.065, + "args": { + "External id": 235132,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966174.937, "dur": 0.065, + "args": { + "External id": 235133,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966175.363, "dur": 0.063, + "args": { + "External id": 235134,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966175.757, "dur": 0.066, + "args": { + "External id": 235135,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966176.166, "dur": 0.073, + "args": { + "External id": 235136,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966176.555, "dur": 0.065, + "args": { + "External id": 235137,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966176.975, "dur": 0.104, + "args": { + "External id": 235138,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966177.435, "dur": 0.064, + "args": { + "External id": 235139,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966177.817, "dur": 0.062, + "args": { + "External id": 235140,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966178.256, "dur": 0.065, + "args": { + "External id": 235141,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966178.694, "dur": 0.065, + "args": { + "External id": 235142,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966179.081, "dur": 0.065, + "args": { + "External id": 235143,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966179.528, "dur": 0.065, + "args": { + "External id": 235144,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966179.920, "dur": 0.070, + "args": { + "External id": 235145,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966180.457, "dur": 0.066, + "args": { + "External id": 235146,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966180.968, "dur": 0.060, + "args": { + "External id": 235147,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966181.354, "dur": 0.065, + "args": { + "External id": 235148,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966181.899, "dur": 0.060, + "args": { + "External id": 235149,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966182.378, "dur": 0.067, + "args": { + "External id": 235150,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966182.806, "dur": 0.094, + "args": { + "External id": 235151,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966183.270, "dur": 0.096, + "args": { + "External id": 235152,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966183.738, "dur": 0.213, + "args": { + "External id": 235153,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966184.332, "dur": 0.195, + "args": { + "External id": 235154,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966184.966, "dur": 0.063, + "args": { + "External id": 235155,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966185.375, "dur": 0.248, + "args": { + "External id": 235156,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966186.102, "dur": 0.082, + "args": { + "External id": 235157,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966186.579, "dur": 0.081, + "args": { + "External id": 235158,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966186.970, "dur": 0.101, + "args": { + "External id": 235159,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966187.417, "dur": 0.096, + "args": { + "External id": 235160,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966187.861, "dur": 0.098, + "args": { + "External id": 235161,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966188.282, "dur": 0.057, + "args": { + "External id": 235162,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966188.726, "dur": 0.066, + "args": { + "External id": 235163,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966189.343, "dur": 0.063, + "args": { + "External id": 235164,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966189.699, "dur": 0.063, + "args": { + "External id": 235165,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966190.106, "dur": 0.066, + "args": { + "External id": 235166,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966190.522, "dur": 0.067, + "args": { + "External id": 235167,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966190.951, "dur": 0.090, + "args": { + "External id": 235168,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966191.420, "dur": 0.051, + "args": { + "External id": 235169,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966191.815, "dur": 0.064, + "args": { + "External id": 235170,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966192.279, "dur": 0.061, + "args": { + "External id": 235171,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966192.921, "dur": 0.065, + "args": { + "External id": 235172,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966193.311, "dur": 0.067, + "args": { + "External id": 235173,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966193.744, "dur": 0.067, + "args": { + "External id": 235174,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966194.175, "dur": 0.135, + "args": { + "External id": 235175,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966194.634, "dur": 0.097, + "args": { + "External id": 235176,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966195.122, "dur": 0.224, + "args": { + "External id": 235177,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966195.728, "dur": 0.091, + "args": { + "External id": 235178,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966196.184, "dur": 0.061, + "args": { + "External id": 235179,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966196.604, "dur": 0.067, + "args": { + "External id": 235180,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966196.941, "dur": 0.081, + "args": { + "External id": 235181,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966197.418, "dur": 0.080, + "args": { + "External id": 235182,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966197.809, "dur": 0.102, + "args": { + "External id": 235183,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966198.270, "dur": 0.341, + "args": { + "External id": 235184,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966199.066, "dur": 0.063, + "args": { + "External id": 235185,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966199.472, "dur": 0.066, + "args": { + "External id": 235186,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966199.878, "dur": 0.062, + "args": { + "External id": 235187,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966200.334, "dur": 0.061, + "args": { + "External id": 235188,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966200.699, "dur": 0.063, + "args": { + "External id": 235189,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966201.299, "dur": 0.100, + "args": { + "External id": 235190,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966201.751, "dur": 0.068, + "args": { + "External id": 235191,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966202.268, "dur": 0.059, + "args": { + "External id": 235192,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966202.665, "dur": 0.066, + "args": { + "External id": 235193,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966203.199, "dur": 0.064, + "args": { + "External id": 235194,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966203.637, "dur": 0.064, + "args": { + "External id": 235195,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966204.058, "dur": 0.063, + "args": { + "External id": 235196,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966204.437, "dur": 0.060, + "args": { + "External id": 235197,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966204.843, "dur": 0.061, + "args": { + "External id": 235198,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966205.231, "dur": 0.065, + "args": { + "External id": 235199,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966205.734, "dur": 0.064, + "args": { + "External id": 235200,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966206.268, "dur": 0.066, + "args": { + "External id": 235201,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966206.788, "dur": 0.069, + "args": { + "External id": 235202,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966207.279, "dur": 0.064, + "args": { + "External id": 235203,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966207.737, "dur": 0.057, + "args": { + "External id": 235204,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966208.217, "dur": 0.059, + "args": { + "External id": 235205,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966208.630, "dur": 0.062, + "args": { + "External id": 235206,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966209.048, "dur": 0.067, + "args": { + "External id": 235207,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966209.432, "dur": 0.067, + "args": { + "External id": 235208,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966209.831, "dur": 0.207, + "args": { + "External id": 235209,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966210.427, "dur": 0.077, + "args": { + "External id": 235210,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966210.824, "dur": 0.062, + "args": { + "External id": 235211,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966211.543, "dur": 0.094, + "args": { + "External id": 235212,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966212.005, "dur": 0.047, + "args": { + "External id": 235213,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966212.387, "dur": 0.061, + "args": { + "External id": 235214,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966212.859, "dur": 0.093, + "args": { + "External id": 235215,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966213.415, "dur": 0.197, + "args": { + "External id": 235216,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966213.956, "dur": 0.092, + "args": { + "External id": 235217,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966214.391, "dur": 0.215, + "args": { + "External id": 235218,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966214.895, "dur": 0.064, + "args": { + "External id": 235219,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966215.319, "dur": 0.187, + "args": { + "External id": 235220,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966215.915, "dur": 0.058, + "args": { + "External id": 235221,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966216.444, "dur": 0.063, + "args": { + "External id": 235222,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966216.966, "dur": 0.062, + "args": { + "External id": 235223,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966217.528, "dur": 0.063, + "args": { + "External id": 235224,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966218.024, "dur": 0.060, + "args": { + "External id": 235225,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966218.579, "dur": 0.059, + "args": { + "External id": 235226,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966219.116, "dur": 0.064, + "args": { + "External id": 235227,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966219.607, "dur": 0.062, + "args": { + "External id": 235228,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966219.974, "dur": 0.065, + "args": { + "External id": 235229,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966220.397, "dur": 0.067, + "args": { + "External id": 235230,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966220.741, "dur": 0.068, + "args": { + "External id": 235231,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966221.188, "dur": 0.064, + "args": { + "External id": 235232,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966221.624, "dur": 0.062, + "args": { + "External id": 235233,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966222.024, "dur": 0.063, + "args": { + "External id": 235234,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966222.485, "dur": 0.062, + "args": { + "External id": 235235,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966222.872, "dur": 0.060, + "args": { + "External id": 235236,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966223.266, "dur": 0.064, + "args": { + "External id": 235237,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966223.708, "dur": 0.063, + "args": { + "External id": 235238,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966224.082, "dur": 0.089, + "args": { + "External id": 235239,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966224.532, "dur": 0.066, + "args": { + "External id": 235240,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966224.951, "dur": 0.060, + "args": { + "External id": 235241,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966225.553, "dur": 0.053, + "args": { + "External id": 235242,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966225.927, "dur": 0.063, + "args": { + "External id": 235243,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966226.521, "dur": 0.059, + "args": { + "External id": 235244,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966227.073, "dur": 0.057, + "args": { + "External id": 235245,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966227.548, "dur": 0.062, + "args": { + "External id": 235246,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966228.037, "dur": 0.065, + "args": { + "External id": 235247,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966228.570, "dur": 0.059, + "args": { + "External id": 235248,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966228.966, "dur": 0.191, + "args": { + "External id": 235249,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966229.523, "dur": 0.213, + "args": { + "External id": 235250,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966230.110, "dur": 0.062, + "args": { + "External id": 235251,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966230.535, "dur": 0.073, + "args": { + "External id": 235252,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966230.892, "dur": 0.062, + "args": { + "External id": 235253,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966231.292, "dur": 0.065, + "args": { + "External id": 235254,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966231.633, "dur": 0.089, + "args": { + "External id": 235255,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966232.179, "dur": 0.086, + "args": { + "External id": 235256,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966232.617, "dur": 0.113, + "args": { + "External id": 235257,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966233.044, "dur": 0.094, + "args": { + "External id": 235258,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966233.500, "dur": 0.064, + "args": { + "External id": 235259,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966234.117, "dur": 0.066, + "args": { + "External id": 235260,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966234.538, "dur": 0.061, + "args": { + "External id": 235261,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966234.867, "dur": 0.065, + "args": { + "External id": 235262,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966235.229, "dur": 0.068, + "args": { + "External id": 235263,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966235.601, "dur": 0.064, + "args": { + "External id": 235264,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966236.074, "dur": 0.061, + "args": { + "External id": 235265,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966236.676, "dur": 0.067, + "args": { + "External id": 235266,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966237.105, "dur": 0.063, + "args": { + "External id": 235267,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966237.543, "dur": 0.065, + "args": { + "External id": 235268,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966237.918, "dur": 0.064, + "args": { + "External id": 235269,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966238.297, "dur": 0.064, + "args": { + "External id": 235270,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966238.721, "dur": 0.062, + "args": { + "External id": 235271,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966239.344, "dur": 0.071, + "args": { + "External id": 235272,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966240.006, "dur": 0.068, + "args": { + "External id": 235273,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966240.421, "dur": 0.060, + "args": { + "External id": 235274,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966240.826, "dur": 0.063, + "args": { + "External id": 235275,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966241.156, "dur": 0.067, + "args": { + "External id": 235276,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966241.572, "dur": 0.066, + "args": { + "External id": 235277,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966241.946, "dur": 0.065, + "args": { + "External id": 235278,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966242.361, "dur": 0.054, + "args": { + "External id": 235279,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966242.737, "dur": 0.064, + "args": { + "External id": 235280,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966243.243, "dur": 0.069, + "args": { + "External id": 235281,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966243.732, "dur": 0.061, + "args": { + "External id": 235282,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966244.041, "dur": 0.054, + "args": { + "External id": 235283,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966244.728, "dur": 0.064, + "args": { + "External id": 235284,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966245.106, "dur": 0.063, + "args": { + "External id": 235285,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966245.655, "dur": 0.057, + "args": { + "External id": 235286,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966245.954, "dur": 0.060, + "args": { + "External id": 235287,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966246.685, "dur": 0.065, + "args": { + "External id": 235288,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966246.987, "dur": 0.054, + "args": { + "External id": 235289,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966247.530, "dur": 0.066, + "args": { + "External id": 235290,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966247.835, "dur": 0.053, + "args": { + "External id": 235291,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966248.397, "dur": 0.062, + "args": { + "External id": 235292,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966248.700, "dur": 0.056, + "args": { + "External id": 235293,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966249.336, "dur": 0.064, + "args": { + "External id": 235294,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966249.643, "dur": 0.084, + "args": { + "External id": 235295,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966250.314, "dur": 0.101, + "args": { + "External id": 235296,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966250.656, "dur": 0.319, + "args": { + "External id": 235297,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966251.814, "dur": 0.093, + "args": { + "External id": 235298,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966252.152, "dur": 0.055, + "args": { + "External id": 235299,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966252.654, "dur": 0.083, + "args": { + "External id": 235300,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966252.974, "dur": 0.054, + "args": { + "External id": 235301,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966253.641, "dur": 0.056, + "args": { + "External id": 235302,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966253.939, "dur": 0.077, + "args": { + "External id": 235303,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966254.670, "dur": 0.064, + "args": { + "External id": 235304,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966254.980, "dur": 0.049, + "args": { + "External id": 235305,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966255.672, "dur": 0.067, + "args": { + "External id": 235306,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966255.976, "dur": 0.052, + "args": { + "External id": 235307,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966256.836, "dur": 0.062, + "args": { + "External id": 235308,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966257.143, "dur": 0.050, + "args": { + "External id": 235309,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966257.761, "dur": 0.063, + "args": { + "External id": 235310,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966258.070, "dur": 0.052, + "args": { + "External id": 235311,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966258.753, "dur": 0.063, + "args": { + "External id": 235312,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966259.064, "dur": 0.051, + "args": { + "External id": 235313,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966259.597, "dur": 0.070, + "args": { + "External id": 235314,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966259.907, "dur": 0.053, + "args": { + "External id": 235315,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966260.572, "dur": 0.064, + "args": { + "External id": 235316,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966260.883, "dur": 0.056, + "args": { + "External id": 235317,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966261.533, "dur": 0.068, + "args": { + "External id": 235318,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966261.842, "dur": 0.054, + "args": { + "External id": 235319,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966262.353, "dur": 0.065, + "args": { + "External id": 235320,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966262.706, "dur": 0.055, + "args": { + "External id": 235321,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966263.402, "dur": 0.065, + "args": { + "External id": 235322,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966263.712, "dur": 0.053, + "args": { + "External id": 235323,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966264.294, "dur": 0.068, + "args": { + "External id": 235324,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966264.608, "dur": 0.091, + "args": { + "External id": 235325,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966265.219, "dur": 0.064, + "args": { + "External id": 235326,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966265.530, "dur": 0.053, + "args": { + "External id": 235327,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966266.314, "dur": 0.062, + "args": { + "External id": 235328,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183442, "tid": 4183442, + "ts": 667115966266.625, "dur": 0.057, + "args": { + "External id": 235329,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 4183442, "tid": 4183442, + "ts": 667115966764.936, "dur": 2670.949, + "args": { + "External id": 235330,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.00029143140233429938", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 9521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 4183442, "tid": 4183442, + "ts": 667115969095.838, "dur": 219.826, + "args": { + "External id": 235331,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.00029143140233429938", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 9522 + } + }, + { + "name": "process_name", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 0, + "args": { + "name": "python3.12" + } + }, + { + "name": "process_labels", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 0, + "args": { + "labels": "CPU" + } + }, + { + "name": "process_sort_index", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 0, + "args": { + "sort_index": 4183442 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 31331, + "args": { + "name": "thread 31331 (pt_autograd_6)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 31331, + "args": { + "sort_index": 31331 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 4183442, + "args": { + "name": "thread 4183442 (python3.12)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 4183442, + "args": { + "sort_index": 4183442 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 31331, + "args": { + "name": "thread 31331 (python3.12)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 667115182889.512, "pid": 4183442, "tid": 31331, + "args": { + "sort_index": 31331 + } + }, + { + "ph": "X", "cat": "Trace", "ts": 667115182823.405, "dur": 786978.270, + "pid": "Spans", "tid": "PyTorch Profiler", + "name": "PyTorch Profiler (0)", + "args": { + "Op count": 0 + } + }, + { + "name": "process_sort_index", "ph": "M", "ts": 667115182823.405, + "pid": "Spans", "tid": 0, + "args": { + "sort_index": 536870912 + } + }, + { + "name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", + "pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 667115182823.405 + }, + { + "name": "Record Window End", "ph": "i", "s": "g", + "pid": "", "tid": "", "ts": 667116014983.203 + } + ], + "traceName": "exp/mtp.340M.batch16.seqlen4096.context4096.warmup1000.update1.steps100000.lr3e-4.cosine/profile_trace/iteration_12288/rank6_trace.json", + "displayTimeUnit": "ms", + "baseTimeNanoseconds": 1751410836000000000 +} \ No newline at end of file