diff --git "a/profile_trace/iteration_23552/rank5_trace.json" "b/profile_trace/iteration_23552/rank5_trace.json" new file mode 100644--- /dev/null +++ "b/profile_trace/iteration_23552/rank5_trace.json" @@ -0,0 +1,68515 @@ + +{ + "schemaVersion": 1, + "deviceProperties": [ + { + "id": 0, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 1, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 2, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 3, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 4, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 5, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 6, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + }, + { + "id": 7, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, + "computeMajor": 9, "computeMinor": 0, + "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, + "regsPerBlock": 65536, "warpSize": 32, + "sharedMemPerBlock": 49152, "numSms": 132 + , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 + } + ], + "cupti_version": 22, + "cuda_runtime_version": 12040, + "cuda_driver_version": 12080, + "distributedInfo": {"backend": "nccl", "rank": 5, "world_size": 8, "pg_count": 1, "pg_config": [{"pg_name": "0", "pg_desc": "default_pg", "backend_config": "cuda:nccl", "pg_size": 8, "ranks": [0, 1, 2, 3, 4, 5, 6, 7]}], "nccl_version": "2.21.5"}, + "record_shapes": 1, + "trace_id": "5B31EB726CC84DF7BB8449F5FC423B92", + "traceEvents": [ + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: DivBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007894759.867, "dur": 131.993, + "args": { + "External id": 446465,"Record function id": 0, "Sequence number": 5285602, "Fwd thread id": 1, "Ev Idx": 0 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "DivBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007894779.342, "dur": 102.348, + "args": { + "External id": 446466,"Sequence number": 5285602, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 1 + } + }, + { + "ph": "f", "id": 1, "pid": 4183441, "tid": 31362, "ts": 676007894779.342, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183441, "tid": 31362, + "ts": 676007894788.348, "dur": 90.936, + "args": { + "External id": 446467,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 2 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007894904.302, "dur": 292.573, + "args": { + "External id": 446468,"Record function id": 0, "Ev Idx": 3 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward", "pid": 4183441, "tid": 31362, + "ts": 676007894979.248, "dur": 124.452, + "args": { + "External id": 446469,"Record function id": 0, "Ev Idx": 4 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.19", "pid": 4183441, "tid": 31362, + "ts": 676007895018.509, "dur": 57.395, + "args": { + "External id": 446470,"Record function id": 0, "Ev Idx": 5 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007895110.085, "dur": 1.969, + "args": { + "External id": 446471,"Sequence number": 5285601, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6 + } + }, + { + "ph": "f", "id": 2, "pid": 4183441, "tid": 31362, "ts": 676007895110.085, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007895117.823, "dur": 67.311, + "args": { + "External id": 446472,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 7 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007895125.942, "dur": 58.633, + "args": { + "External id": 446473,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 8 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007895138.076, "dur": 7.224, + "args": { + "External id": 446474,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007895207.867, "dur": 16918.310, + "args": { + "External id": 446475,"Record function id": 0, "Sequence number": 5285599, "Fwd thread id": 1, "Ev Idx": 10 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007895209.875, "dur": 16904.650, + "args": { + "External id": 446476,"Sequence number": 5285599, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11 + } + }, + { + "ph": "f", "id": 3, "pid": 4183441, "tid": 31362, "ts": 676007895209.875, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007895260.091, "dur": 3.747, + "args": { + "External id": 446477,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 12 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007895268.954, "dur": 16712.522, + "args": { + "External id": 446478,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 13 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007895271.543, "dur": 16709.680, + "args": { + "External id": 446479,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 14 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007895276.597, "dur": 7.889, + "args": { + "External id": 446480,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 15 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007895286.969, "dur": 16692.363, + "args": { + "External id": 446481,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 16 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183441, "tid": 31362, + "ts": 676007911986.848, "dur": 0.517, + "args": { + "External id": 446482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 17 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183441, "tid": 31362, + "ts": 676007911990.116, "dur": 3.232, + "args": { + "External id": 446483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 18 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183441, "tid": 31362, + "ts": 676007911991.843, "dur": 1.380, + "args": { + "External id": 446484,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 19 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 31362, + "ts": 676007911999.836, "dur": 34.777, + "args": { + "External id": 446485,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 20 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 31362, + "ts": 676007912044.383, "dur": 59.932, + "args": { + "External id": 446486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 21 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 31362, + "ts": 676007912046.386, "dur": 57.738, + "args": { + "External id": 446487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 22 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 31362, + "ts": 676007912048.200, "dur": 55.206, + "args": { + "External id": 446488,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 23 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912138.819, "dur": 21.502, + "args": { + "External id": 446489,"Record function id": 0, "Sequence number": 5285598, "Fwd thread id": 1, "Ev Idx": 24 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912140.883, "dur": 15.183, + "args": { + "External id": 446490,"Sequence number": 5285598, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 25 + } + }, + { + "ph": "f", "id": 4, "pid": 4183441, "tid": 31362, "ts": 676007912140.883, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007912145.150, "dur": 10.732, + "args": { + "External id": 446491,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 26 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007912148.608, "dur": 7.086, + "args": { + "External id": 446492,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 27 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912164.521, "dur": 107.468, + "args": { + "External id": 446493,"Record function id": 0, "Sequence number": 5285597, "Fwd thread id": 1, "Ev Idx": 28 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912165.948, "dur": 97.914, + "args": { + "External id": 446494,"Sequence number": 5285597, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 29 + } + }, + { + "ph": "f", "id": 5, "pid": 4183441, "tid": 31362, "ts": 676007912165.948, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007912169.921, "dur": 93.332, + "args": { + "External id": 446495,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 30 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007912176.242, "dur": 40.494, + "args": { + "External id": 446496,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 31 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007912180.172, "dur": 7.251, + "args": { + "External id": 446497,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 32 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007912189.840, "dur": 26.568, + "args": { + "External id": 446498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 33 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007912193.216, "dur": 22.654, + "args": { + "External id": 446499,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 34 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007912222.124, "dur": 4.524, + "args": { + "External id": 446500,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 35 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912224.692, "dur": 1.624, + "args": { + "External id": 446501,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 36 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007912227.772, "dur": 34.592, + "args": { + "External id": 446502,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 37 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912276.623, "dur": 65.962, + "args": { + "External id": 446503,"Record function id": 0, "Sequence number": 5285596, "Fwd thread id": 1, "Ev Idx": 38 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912277.578, "dur": 59.773, + "args": { + "External id": 446504,"Sequence number": 5285596, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 39 + } + }, + { + "ph": "f", "id": 6, "pid": 4183441, "tid": 31362, "ts": 676007912277.578, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183441, "tid": 31362, + "ts": 676007912280.436, "dur": 56.668, + "args": { + "External id": 446505,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "3"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 40 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007912283.578, "dur": 23.446, + "args": { + "External id": 446506,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 41 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007912286.633, "dur": 2.954, + "args": { + "External id": 446507,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 42 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007912290.097, "dur": 16.666, + "args": { + "External id": 446508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 43 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007912293.016, "dur": 13.326, + "args": { + "External id": 446509,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 44 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007912310.875, "dur": 5.551, + "args": { + "External id": 446510,"Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 45 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912314.685, "dur": 0.996, + "args": { + "External id": 446511,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 46 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007912317.445, "dur": 19.181, + "args": { + "External id": 446512,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 47 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912346.340, "dur": 110.980, + "args": { + "External id": 446513,"Record function id": 0, "Sequence number": 5285595, "Fwd thread id": 1, "Ev Idx": 48 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912347.533, "dur": 104.045, + "args": { + "External id": 446514,"Sequence number": 5285595, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 49 + } + }, + { + "ph": "f", "id": 7, "pid": 4183441, "tid": 31362, "ts": 676007912347.533, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007912349.443, "dur": 101.756, + "args": { + "External id": 446515,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 50 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007912354.753, "dur": 18.421, + "args": { + "External id": 446516,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 51 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007912355.537, "dur": 2.752, + "args": { + "External id": 446517,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 52 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007912358.888, "dur": 14.030, + "args": { + "External id": 446518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 53 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007912359.905, "dur": 12.644, + "args": { + "External id": 446519,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 54 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007912375.991, "dur": 3.927, + "args": { + "External id": 446520,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 55 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912377.012, "dur": 2.757, + "args": { + "External id": 446521,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 56 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007912380.746, "dur": 69.588, + "args": { + "External id": 446522,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 57 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912462.580, "dur": 71.787, + "args": { + "External id": 446523,"Record function id": 0, "Sequence number": 5285594, "Fwd thread id": 1, "Ev Idx": 58 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912463.764, "dur": 66.966, + "args": { + "External id": 446524,"Sequence number": 5285594, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 59 + } + }, + { + "ph": "f", "id": 8, "pid": 4183441, "tid": 31362, "ts": 676007912463.764, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007912464.944, "dur": 65.571, + "args": { + "External id": 446525,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 60 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007912465.950, "dur": 16.927, + "args": { + "External id": 446526,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 61 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007912468.912, "dur": 1.816, + "args": { + "External id": 446527,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 62 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007912471.364, "dur": 11.259, + "args": { + "External id": 446528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 63 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007912472.038, "dur": 10.276, + "args": { + "External id": 446529,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 64 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007912483.851, "dur": 3.701, + "args": { + "External id": 446530,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 65 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912486.575, "dur": 0.846, + "args": { + "External id": 446531,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 66 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007912489.753, "dur": 40.033, + "args": { + "External id": 446532,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 67 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912538.801, "dur": 34.093, + "args": { + "External id": 446533,"Record function id": 0, "Sequence number": 5285593, "Fwd thread id": 1, "Ev Idx": 68 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007912540.120, "dur": 0.805, + "args": { + "External id": 446534,"Sequence number": 5285593, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 69 + } + }, + { + "ph": "f", "id": 9, "pid": 4183441, "tid": 31362, "ts": 676007912540.120, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007912543.867, "dur": 24.665, + "args": { + "External id": 446535,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 70 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007912545.655, "dur": 22.390, + "args": { + "External id": 446536,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 71 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912551.572, "dur": 0.441, + "args": { + "External id": 446537,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 72 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007912577.766, "dur": 1066.192, + "args": { + "External id": 446538,"Record function id": 0, "Sequence number": 5285591, "Fwd thread id": 1, "Ev Idx": 73 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007912579.658, "dur": 1029.154, + "args": { + "External id": 446539,"Sequence number": 5285591, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 74 + } + }, + { + "ph": "f", "id": 10, "pid": 4183441, "tid": 31362, "ts": 676007912579.658, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007912617.866, "dur": 2.467, + "args": { + "External id": 446540,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 75 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007912622.748, "dur": 902.196, + "args": { + "External id": 446541,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 76 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007912624.717, "dur": 899.898, + "args": { + "External id": 446542,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 77 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007912627.100, "dur": 4.649, + "args": { + "External id": 446543,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 78 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007912632.514, "dur": 891.200, + "args": { + "External id": 446544,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 79 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183441, "tid": 31362, + "ts": 676007913528.210, "dur": 0.352, + "args": { + "External id": 446545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 80 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183441, "tid": 31362, + "ts": 676007913529.943, "dur": 3.860, + "args": { + "External id": 446546,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 81 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183441, "tid": 31362, + "ts": 676007913532.896, "dur": 0.767, + "args": { + "External id": 446547,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 82 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 31362, + "ts": 676007913537.767, "dur": 21.372, + "args": { + "External id": 446548,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 83 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 31362, + "ts": 676007913564.300, "dur": 37.619, + "args": { + "External id": 446549,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 84 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 31362, + "ts": 676007913565.344, "dur": 36.409, + "args": { + "External id": 446550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 85 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 31362, + "ts": 676007913566.495, "dur": 34.919, + "args": { + "External id": 446551,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 86 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007913619.362, "dur": 19.933, + "args": { + "External id": 446552,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 87 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913674.902, "dur": 18.211, + "args": { + "External id": 446553,"Record function id": 0, "Sequence number": 5285590, "Fwd thread id": 1, "Ev Idx": 88 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913677.045, "dur": 12.013, + "args": { + "External id": 446554,"Sequence number": 5285590, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 89 + } + }, + { + "ph": "f", "id": 11, "pid": 4183441, "tid": 31362, "ts": 676007913677.045, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007913681.772, "dur": 7.060, + "args": { + "External id": 446555,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 90 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007913684.820, "dur": 3.707, + "args": { + "External id": 446556,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 91 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913697.969, "dur": 62.868, + "args": { + "External id": 446557,"Record function id": 0, "Sequence number": 5285589, "Fwd thread id": 1, "Ev Idx": 92 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913698.955, "dur": 55.987, + "args": { + "External id": 446558,"Sequence number": 5285589, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 93 + } + }, + { + "ph": "f", "id": 12, "pid": 4183441, "tid": 31362, "ts": 676007913698.955, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007913700.594, "dur": 53.996, + "args": { + "External id": 446559,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 94 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007913702.580, "dur": 25.581, + "args": { + "External id": 446560,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 95 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007913705.518, "dur": 4.934, + "args": { + "External id": 446561,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 96 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007913711.339, "dur": 16.537, + "args": { + "External id": 446562,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 97 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007913712.445, "dur": 14.998, + "args": { + "External id": 446563,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 98 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007913729.520, "dur": 2.736, + "args": { + "External id": 446564,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 99 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007913731.249, "dur": 0.793, + "args": { + "External id": 446565,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007913733.089, "dur": 20.795, + "args": { + "External id": 446566,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913766.816, "dur": 59.704, + "args": { + "External id": 446567,"Record function id": 0, "Sequence number": 5285588, "Fwd thread id": 1, "Ev Idx": 102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913767.767, "dur": 54.021, + "args": { + "External id": 446568,"Sequence number": 5285588, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 103 + } + }, + { + "ph": "f", "id": 13, "pid": 4183441, "tid": 31362, "ts": 676007913767.767, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183441, "tid": 31362, + "ts": 676007913771.754, "dur": 49.741, + "args": { + "External id": 446569,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "2"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007913773.298, "dur": 17.579, + "args": { + "External id": 446570,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007913773.868, "dur": 2.120, + "args": { + "External id": 446571,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007913776.683, "dur": 13.905, + "args": { + "External id": 446572,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007913777.697, "dur": 12.445, + "args": { + "External id": 446573,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007913791.862, "dur": 5.436, + "args": { + "External id": 446574,"Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007913796.114, "dur": 0.663, + "args": { + "External id": 446575,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007913798.114, "dur": 22.848, + "args": { + "External id": 446576,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913830.147, "dur": 91.079, + "args": { + "External id": 446577,"Record function id": 0, "Sequence number": 5285587, "Fwd thread id": 1, "Ev Idx": 112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913831.788, "dur": 85.306, + "args": { + "External id": 446578,"Sequence number": 5285587, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 113 + } + }, + { + "ph": "f", "id": 14, "pid": 4183441, "tid": 31362, "ts": 676007913831.788, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007913835.164, "dur": 81.649, + "args": { + "External id": 446579,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007913836.154, "dur": 15.480, + "args": { + "External id": 446580,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007913836.885, "dur": 2.526, + "args": { + "External id": 446581,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007913840.108, "dur": 11.269, + "args": { + "External id": 446582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007913840.937, "dur": 10.086, + "args": { + "External id": 446583,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007913853.911, "dur": 4.031, + "args": { + "External id": 446584,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007913857.258, "dur": 0.540, + "args": { + "External id": 446585,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007913858.491, "dur": 57.669, + "args": { + "External id": 446586,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913926.719, "dur": 76.515, + "args": { + "External id": 446587,"Record function id": 0, "Sequence number": 5285586, "Fwd thread id": 1, "Ev Idx": 122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007913927.783, "dur": 57.379, + "args": { + "External id": 446588,"Sequence number": 5285586, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 123 + } + }, + { + "ph": "f", "id": 15, "pid": 4183441, "tid": 31362, "ts": 676007913927.783, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007913930.561, "dur": 54.373, + "args": { + "External id": 446589,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007913931.626, "dur": 13.760, + "args": { + "External id": 446590,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007913932.354, "dur": 1.464, + "args": { + "External id": 446591,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007913934.550, "dur": 10.602, + "args": { + "External id": 446592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007913935.541, "dur": 9.332, + "args": { + "External id": 446593,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007913946.280, "dur": 1.819, + "args": { + "External id": 446594,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007913947.377, "dur": 0.585, + "args": { + "External id": 446595,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007913948.751, "dur": 35.646, + "args": { + "External id": 446596,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007913988.644, "dur": 13.226, + "args": { + "External id": 446597,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007914007.128, "dur": 36.244, + "args": { + "External id": 446598,"Record function id": 0, "Sequence number": 5285585, "Fwd thread id": 1, "Ev Idx": 133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007914009.710, "dur": 0.939, + "args": { + "External id": 446599,"Sequence number": 5285585, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 134 + } + }, + { + "ph": "f", "id": 16, "pid": 4183441, "tid": 31362, "ts": 676007914009.710, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007914013.116, "dur": 27.372, + "args": { + "External id": 446600,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007914014.681, "dur": 25.454, + "args": { + "External id": 446601,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007914021.860, "dur": 0.507, + "args": { + "External id": 446602,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007914047.804, "dur": 1470.148, + "args": { + "External id": 446603,"Record function id": 0, "Sequence number": 5285583, "Fwd thread id": 1, "Ev Idx": 138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007914051.136, "dur": 1439.349, + "args": { + "External id": 446604,"Sequence number": 5285583, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 139 + } + }, + { + "ph": "f", "id": 17, "pid": 4183441, "tid": 31362, "ts": 676007914051.136, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007914079.125, "dur": 14.775, + "args": { + "External id": 446605,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007914097.179, "dur": 1313.411, + "args": { + "External id": 446606,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007914098.606, "dur": 1311.733, + "args": { + "External id": 446607,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007914100.950, "dur": 5.421, + "args": { + "External id": 446608,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007914107.255, "dur": 1301.989, + "args": { + "External id": 446609,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183441, "tid": 31362, + "ts": 676007915413.562, "dur": 0.226, + "args": { + "External id": 446610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183441, "tid": 31362, + "ts": 676007915414.794, "dur": 2.218, + "args": { + "External id": 446611,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183441, "tid": 31362, + "ts": 676007915416.106, "dur": 0.772, + "args": { + "External id": 446612,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 31362, + "ts": 676007915420.322, "dur": 20.275, + "args": { + "External id": 446613,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 31362, + "ts": 676007915447.016, "dur": 37.160, + "args": { + "External id": 446614,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 31362, + "ts": 676007915448.177, "dur": 35.834, + "args": { + "External id": 446615,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 31362, + "ts": 676007915450.864, "dur": 32.893, + "args": { + "External id": 446616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007915497.997, "dur": 16.666, + "args": { + "External id": 446617,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915527.187, "dur": 11.956, + "args": { + "External id": 446618,"Record function id": 0, "Sequence number": 5285582, "Fwd thread id": 1, "Ev Idx": 153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915528.692, "dur": 6.702, + "args": { + "External id": 446619,"Sequence number": 5285582, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 154 + } + }, + { + "ph": "f", "id": 18, "pid": 4183441, "tid": 31362, "ts": 676007915528.692, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007915531.312, "dur": 3.886, + "args": { + "External id": 446620,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007915532.315, "dur": 2.779, + "args": { + "External id": 446621,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915542.517, "dur": 64.300, + "args": { + "External id": 446622,"Record function id": 0, "Sequence number": 5285581, "Fwd thread id": 1, "Ev Idx": 157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915543.612, "dur": 57.567, + "args": { + "External id": 446623,"Sequence number": 5285581, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 158 + } + }, + { + "ph": "f", "id": 19, "pid": 4183441, "tid": 31362, "ts": 676007915543.612, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007915545.219, "dur": 55.640, + "args": { + "External id": 446624,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007915551.105, "dur": 19.884, + "args": { + "External id": 446625,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007915552.098, "dur": 2.500, + "args": { + "External id": 446626,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007915555.466, "dur": 15.238, + "args": { + "External id": 446627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007915556.798, "dur": 13.457, + "args": { + "External id": 446628,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007915572.333, "dur": 4.245, + "args": { + "External id": 446629,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915575.571, "dur": 0.802, + "args": { + "External id": 446630,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007915577.428, "dur": 22.766, + "args": { + "External id": 446631,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915610.664, "dur": 79.613, + "args": { + "External id": 446632,"Record function id": 0, "Sequence number": 5285580, "Fwd thread id": 1, "Ev Idx": 167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915611.668, "dur": 73.666, + "args": { + "External id": 446633,"Sequence number": 5285580, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 168 + } + }, + { + "ph": "f", "id": 20, "pid": 4183441, "tid": 31362, "ts": 676007915611.668, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183441, "tid": 31362, + "ts": 676007915613.431, "dur": 71.569, + "args": { + "External id": 446634,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007915614.850, "dur": 18.666, + "args": { + "External id": 446635,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007915617.461, "dur": 2.081, + "args": { + "External id": 446636,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007915620.183, "dur": 13.090, + "args": { + "External id": 446637,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007915621.062, "dur": 11.827, + "args": { + "External id": 446638,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007915634.380, "dur": 7.519, + "args": { + "External id": 446639,"Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915638.897, "dur": 2.599, + "args": { + "External id": 446640,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007915642.646, "dur": 41.507, + "args": { + "External id": 446641,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915695.708, "dur": 76.833, + "args": { + "External id": 446642,"Record function id": 0, "Sequence number": 5285579, "Fwd thread id": 1, "Ev Idx": 177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915696.912, "dur": 72.613, + "args": { + "External id": 446643,"Sequence number": 5285579, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 178 + } + }, + { + "ph": "f", "id": 21, "pid": 4183441, "tid": 31362, "ts": 676007915696.912, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007915698.954, "dur": 70.254, + "args": { + "External id": 446644,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007915700.256, "dur": 23.261, + "args": { + "External id": 446645,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007915702.972, "dur": 2.613, + "args": { + "External id": 446646,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007915706.439, "dur": 16.778, + "args": { + "External id": 446647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007915707.197, "dur": 15.614, + "args": { + "External id": 446648,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007915724.410, "dur": 4.129, + "args": { + "External id": 446649,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915727.657, "dur": 0.666, + "args": { + "External id": 446650,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007915729.292, "dur": 39.243, + "args": { + "External id": 446651,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915776.475, "dur": 80.870, + "args": { + "External id": 446652,"Record function id": 0, "Sequence number": 5285578, "Fwd thread id": 1, "Ev Idx": 187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915777.449, "dur": 62.210, + "args": { + "External id": 446653,"Sequence number": 5285578, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 188 + } + }, + { + "ph": "f", "id": 22, "pid": 4183441, "tid": 31362, "ts": 676007915777.449, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007915780.641, "dur": 58.769, + "args": { + "External id": 446654,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007915781.623, "dur": 17.048, + "args": { + "External id": 446655,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007915783.914, "dur": 1.819, + "args": { + "External id": 446656,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007915786.382, "dur": 12.019, + "args": { + "External id": 446657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007915787.027, "dur": 11.000, + "args": { + "External id": 446658,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007915799.389, "dur": 1.736, + "args": { + "External id": 446659,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915800.384, "dur": 0.598, + "args": { + "External id": 446660,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007915801.963, "dur": 36.893, + "args": { + "External id": 446661,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007915842.716, "dur": 13.348, + "args": { + "External id": 446662,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915860.726, "dur": 32.556, + "args": { + "External id": 446663,"Record function id": 0, "Sequence number": 5285577, "Fwd thread id": 1, "Ev Idx": 198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007915861.809, "dur": 0.874, + "args": { + "External id": 446664,"Sequence number": 5285577, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 199 + } + }, + { + "ph": "f", "id": 23, "pid": 4183441, "tid": 31362, "ts": 676007915861.809, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007915864.120, "dur": 23.700, + "args": { + "External id": 446665,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007915867.128, "dur": 20.391, + "args": { + "External id": 446666,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915870.893, "dur": 0.457, + "args": { + "External id": 446667,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007915897.324, "dur": 1467.073, + "args": { + "External id": 446668,"Record function id": 0, "Sequence number": 5285576, "Fwd thread id": 1, "Ev Idx": 203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007915909.139, "dur": 1426.335, + "args": { + "External id": 446669,"Sequence number": 5285576, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 204 + } + }, + { + "ph": "f", "id": 24, "pid": 4183441, "tid": 31362, "ts": 676007915909.139, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007915933.901, "dur": 1.902, + "args": { + "External id": 446670,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007915937.608, "dur": 1316.104, + "args": { + "External id": 446671,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007915938.660, "dur": 1314.806, + "args": { + "External id": 446672,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007915940.393, "dur": 2.657, + "args": { + "External id": 446673,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007915943.864, "dur": 1308.261, + "args": { + "External id": 446674,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 4183441, "tid": 31362, + "ts": 676007917258.594, "dur": 0.404, + "args": { + "External id": 446675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 4183441, "tid": 31362, + "ts": 676007917260.082, "dur": 2.347, + "args": { + "External id": 446676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 4183441, "tid": 31362, + "ts": 676007917261.596, "dur": 0.693, + "args": { + "External id": 446677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 31362, + "ts": 676007917265.732, "dur": 22.265, + "args": { + "External id": 446678,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 31362, + "ts": 676007917291.980, "dur": 37.678, + "args": { + "External id": 446679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 31362, + "ts": 676007917292.790, "dur": 36.702, + "args": { + "External id": 446680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 31362, + "ts": 676007917293.802, "dur": 35.405, + "args": { + "External id": 446681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007917345.720, "dur": 14.684, + "args": { + "External id": 446682,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007917374.914, "dur": 11.650, + "args": { + "External id": 446683,"Record function id": 0, "Ev Idx": 218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007917377.363, "dur": 7.657, + "args": { + "External id": 446684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007917380.588, "dur": 3.454, + "args": { + "External id": 446685,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007917381.210, "dur": 2.727, + "args": { + "External id": 446686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917389.898, "dur": 9.098, + "args": { + "External id": 446687,"Record function id": 0, "Sequence number": 5285575, "Fwd thread id": 1, "Ev Idx": 222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917391.067, "dur": 5.502, + "args": { + "External id": 446688,"Sequence number": 5285575, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 223 + } + }, + { + "ph": "f", "id": 25, "pid": 4183441, "tid": 31362, "ts": 676007917391.067, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007917393.054, "dur": 3.316, + "args": { + "External id": 446689,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007917394.004, "dur": 2.248, + "args": { + "External id": 446690,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917402.056, "dur": 62.083, + "args": { + "External id": 446691,"Record function id": 0, "Sequence number": 5285574, "Fwd thread id": 1, "Ev Idx": 226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917403.137, "dur": 55.296, + "args": { + "External id": 446692,"Sequence number": 5285574, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 227 + } + }, + { + "ph": "f", "id": 26, "pid": 4183441, "tid": 31362, "ts": 676007917403.137, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007917406.763, "dur": 51.356, + "args": { + "External id": 446693,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007917410.720, "dur": 19.119, + "args": { + "External id": 446694,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007917411.670, "dur": 2.436, + "args": { + "External id": 446695,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007917414.854, "dur": 14.645, + "args": { + "External id": 446696,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007917416.025, "dur": 12.939, + "args": { + "External id": 446697,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007917431.026, "dur": 4.234, + "args": { + "External id": 446698,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007917434.279, "dur": 0.787, + "args": { + "External id": 446699,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[4194304, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007917435.992, "dur": 21.417, + "args": { + "External id": 446700,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917469.670, "dur": 54.452, + "args": { + "External id": 446701,"Record function id": 0, "Sequence number": 5285573, "Fwd thread id": 1, "Ev Idx": 236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917470.978, "dur": 49.921, + "args": { + "External id": 446702,"Sequence number": 5285573, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 237 + } + }, + { + "ph": "f", "id": 27, "pid": 4183441, "tid": 31362, "ts": 676007917470.978, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 4183441, "tid": 31362, + "ts": 676007917472.690, "dur": 47.936, + "args": { + "External id": 446703,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "2", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007917473.941, "dur": 20.176, + "args": { + "External id": 446704,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007917478.320, "dur": 2.195, + "args": { + "External id": 446705,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007917481.407, "dur": 12.457, + "args": { + "External id": 446706,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007917482.375, "dur": 11.184, + "args": { + "External id": 446707,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007917494.976, "dur": 5.907, + "args": { + "External id": 446708,"Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007917499.528, "dur": 0.941, + "args": { + "External id": 446709,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007917501.499, "dur": 18.577, + "args": { + "External id": 446710,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917527.893, "dur": 71.694, + "args": { + "External id": 446711,"Record function id": 0, "Sequence number": 5285572, "Fwd thread id": 1, "Ev Idx": 246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917528.894, "dur": 68.149, + "args": { + "External id": 446712,"Sequence number": 5285572, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 247 + } + }, + { + "ph": "f", "id": 28, "pid": 4183441, "tid": 31362, "ts": 676007917528.894, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007917529.880, "dur": 66.850, + "args": { + "External id": 446713,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007917530.823, "dur": 20.283, + "args": { + "External id": 446714,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007917535.359, "dur": 1.617, + "args": { + "External id": 446715,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007917537.632, "dur": 13.231, + "args": { + "External id": 446716,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007917538.370, "dur": 12.077, + "args": { + "External id": 446717,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007917551.948, "dur": 3.389, + "args": { + "External id": 446718,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007917553.019, "dur": 2.149, + "args": { + "External id": 446719,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007917555.759, "dur": 40.379, + "args": { + "External id": 446720,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917603.143, "dur": 120.910, + "args": { + "External id": 446721,"Record function id": 0, "Sequence number": 5285571, "Fwd thread id": 1, "Ev Idx": 256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007917604.111, "dur": 94.942, + "args": { + "External id": 446722,"Sequence number": 5285571, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 257 + } + }, + { + "ph": "f", "id": 29, "pid": 4183441, "tid": 31362, "ts": 676007917604.111, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 4183441, "tid": 31362, + "ts": 676007917605.409, "dur": 93.268, + "args": { + "External id": 446723,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], [], []], "Ev Idx": 258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 31362, + "ts": 676007917606.568, "dur": 24.119, + "args": { + "External id": 446724,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007917611.013, "dur": 1.663, + "args": { + "External id": 446725,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 1024]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 31362, + "ts": 676007917615.709, "dur": 14.706, + "args": { + "External id": 446726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 31362, + "ts": 676007917618.367, "dur": 11.633, + "args": { + "External id": 446727,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], []], "Ev Idx": 262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007917631.357, "dur": 3.622, + "args": { + "External id": 446728,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007917634.040, "dur": 0.785, + "args": { + "External id": 446729,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007917635.522, "dur": 61.958, + "args": { + "External id": 446730,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007917703.895, "dur": 18.075, + "args": { + "External id": 446731,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [16777216, 4096, 1024, 1], []], "Input Dims": [[16, 4096, 4, 1024], [16, 4096, 4, 1024], []], "Ev Idx": 266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007917731.269, "dur": 384.205, + "args": { + "External id": 446732,"Record function id": 0, "Sequence number": 5285570, "Fwd thread id": 1, "Ev Idx": 267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007917732.929, "dur": 369.313, + "args": { + "External id": 446733,"Sequence number": 5285570, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 268 + } + }, + { + "ph": "f", "id": 30, "pid": 4183441, "tid": 31362, "ts": 676007917732.929, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676007917910.626, "dur": 46.007, + "args": { + "External id": 446734,"kernel_hash": "cxdhjwvz2zq5a6tr3csmr5qtuhxtrqagqlybbtuuwjocpwkglula", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "262144", "1024", "1", "1986", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xd/cxdhjwvz2zq5a6tr3csmr5qtuhxtrqagqlybbtuuwjocpwkglula.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 1024], [1024], [262144, 1024], [262144, 1024], [132, 1024], [262144], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_0", "pid": 4183441, "tid": 31362, + "ts": 676007917988.511, "dur": 28.460, + "args": { + "External id": 446735,"kernel_hash": "ctkdkix3f4a6v32mvgnxj3riqytga3v4xc7aah43z34hudbmfkbl", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/tk/ctkdkix3f4a6v32mvgnxj3riqytga3v4xc7aah43z34hudbmfkbl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_1", "pid": 4183441, "tid": 31362, + "ts": 676007918038.073, "dur": 23.843, + "args": { + "External id": 446736,"kernel_hash": "cez57yhbmcqsgpjextfoqzmflfbildq4izneuaqtyn74lue5fgwg", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/ez/cez57yhbmcqsgpjextfoqzmflfbildq4izneuaqtyn74lue5fgwg.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918126.535, "dur": 10.757, + "args": { + "External id": 446737,"Record function id": 0, "Ev Idx": 272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918128.587, "dur": 8.026, + "args": { + "External id": 446738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007918131.601, "dur": 4.109, + "args": { + "External id": 446739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007918132.579, "dur": 2.966, + "args": { + "External id": 446740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: StackBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918143.083, "dur": 34.201, + "args": { + "External id": 446741,"Record function id": 0, "Sequence number": 5285569, "Fwd thread id": 1, "Ev Idx": 276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "StackBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918144.186, "dur": 21.693, + "args": { + "External id": 446742,"Sequence number": 5285569, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1024, 1]], "Input Dims": [[16, 4096, 4, 1024]], "Ev Idx": 277 + } + }, + { + "ph": "f", "id": 31, "pid": 4183441, "tid": 31362, "ts": 676007918144.186, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007918146.394, "dur": 7.102, + "args": { + "External id": 446743,"Record function id": 0, "Concrete Inputs": ["", "-2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918150.595, "dur": 1.331, + "args": { + "External id": 446744,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007918154.185, "dur": 4.025, + "args": { + "External id": 446745,"Record function id": 0, "Concrete Inputs": ["", "-2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918156.871, "dur": 0.622, + "args": { + "External id": 446746,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007918158.715, "dur": 2.023, + "args": { + "External id": 446747,"Record function id": 0, "Concrete Inputs": ["", "-2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918159.718, "dur": 0.343, + "args": { + "External id": 446748,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 31362, + "ts": 676007918161.241, "dur": 4.077, + "args": { + "External id": 446749,"Record function id": 0, "Concrete Inputs": ["", "-2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918164.099, "dur": 0.468, + "args": { + "External id": 446750,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918181.090, "dur": 6.859, + "args": { + "External id": 446751,"Record function id": 0, "Sequence number": 5285568, "Fwd thread id": 1, "Ev Idx": 286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918181.891, "dur": 1.049, + "args": { + "External id": 446752,"Sequence number": 5285568, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 287 + } + }, + { + "ph": "f", "id": 32, "pid": 4183441, "tid": 31362, "ts": 676007918181.891, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007918192.261, "dur": 563.389, + "args": { + "External id": 446753,"Record function id": 0, "Sequence number": 5285567, "Fwd thread id": 1, "Ev Idx": 288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007918193.449, "dur": 546.823, + "args": { + "External id": 446754,"Sequence number": 5285567, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 289 + } + }, + { + "ph": "f", "id": 33, "pid": 4183441, "tid": 31362, "ts": 676007918193.449, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918236.173, "dur": 12.198, + "args": { + "External id": 446755,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007918244.140, "dur": 3.944, + "args": { + "External id": 446756,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918253.953, "dur": 10.474, + "args": { + "External id": 446757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918257.498, "dur": 6.000, + "args": { + "External id": 446758,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918260.811, "dur": 2.476, + "args": { + "External id": 446759,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 31362, + "ts": 676007918270.105, "dur": 127.545, + "args": { + "External id": 446760,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918271.258, "dur": 3.270, + "args": { + "External id": 446761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918272.107, "dur": 1.672, + "args": { + "External id": 446762,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918273.232, "dur": 0.388, + "args": { + "External id": 446763,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 31362, + "ts": 676007918276.695, "dur": 120.169, + "args": { + "External id": 446764,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007918279.353, "dur": 116.561, + "args": { + "External id": 446765,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007918405.923, "dur": 5.773, + "args": { + "External id": 446766,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918408.956, "dur": 2.622, + "args": { + "External id": 446767,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007918452.299, "dur": 5.193, + "args": { + "External id": 446768,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007918458.385, "dur": 2.268, + "args": { + "External id": 446769,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007918461.373, "dur": 1.718, + "args": { + "External id": 446770,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918504.159, "dur": 2.698, + "args": { + "External id": 446771,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918504.906, "dur": 1.797, + "args": { + "External id": 446772,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183441, "tid": 31362, + "ts": 676007918535.503, "dur": 179.616, + "args": { + "External id": 446773,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007918543.296, "dur": 8.657, + "args": { + "External id": 446774,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918546.375, "dur": 2.680, + "args": { + "External id": 446775,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007918556.119, "dur": 6.250, + "args": { + "External id": 446776,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918560.956, "dur": 0.606, + "args": { + "External id": 446777,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007918563.704, "dur": 3.372, + "args": { + "External id": 446778,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918566.254, "dur": 0.457, + "args": { + "External id": 446779,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007918567.798, "dur": 4.201, + "args": { + "External id": 446780,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918570.915, "dur": 0.592, + "args": { + "External id": 446781,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007918578.067, "dur": 4.048, + "args": { + "External id": 446782,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918580.998, "dur": 0.825, + "args": { + "External id": 446783,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918582.844, "dur": 6.321, + "args": { + "External id": 446784,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007918587.286, "dur": 1.662, + "args": { + "External id": 446785,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007918589.875, "dur": 1.563, + "args": { + "External id": 446786,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918590.646, "dur": 0.529, + "args": { + "External id": 446787,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918593.986, "dur": 1.950, + "args": { + "External id": 446788,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918594.492, "dur": 1.367, + "args": { + "External id": 446789,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007918597.898, "dur": 102.501, + "args": { + "External id": 446790,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918703.611, "dur": 1.581, + "args": { + "External id": 446791,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007918706.061, "dur": 4.837, + "args": { + "External id": 446792,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918709.461, "dur": 0.586, + "args": { + "External id": 446793,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918713.058, "dur": 0.921, + "args": { + "External id": 446794,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918768.133, "dur": 10.288, + "args": { + "External id": 446795,"Record function id": 0, "Ev Idx": 330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918770.264, "dur": 7.417, + "args": { + "External id": 446796,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007918772.985, "dur": 3.920, + "args": { + "External id": 446797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007918774.269, "dur": 2.535, + "args": { + "External id": 446798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918782.195, "dur": 10.383, + "args": { + "External id": 446799,"Record function id": 0, "Sequence number": 5285566, "Fwd thread id": 1, "Ev Idx": 334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918783.186, "dur": 6.009, + "args": { + "External id": 446800,"Sequence number": 5285566, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 335 + } + }, + { + "ph": "f", "id": 34, "pid": 4183441, "tid": 31362, "ts": 676007918783.186, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918785.155, "dur": 3.814, + "args": { + "External id": 446801,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918787.944, "dur": 0.892, + "args": { + "External id": 446802,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918796.065, "dur": 137.772, + "args": { + "External id": 446803,"Record function id": 0, "Sequence number": 5285565, "Fwd thread id": 1, "Ev Idx": 338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918798.999, "dur": 126.649, + "args": { + "External id": 446804,"Sequence number": 5285565, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 339 + } + }, + { + "ph": "f", "id": 35, "pid": 4183441, "tid": 31362, "ts": 676007918798.999, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918804.316, "dur": 4.318, + "args": { + "External id": 446805,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918805.734, "dur": 2.329, + "args": { + "External id": 446806,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918807.231, "dur": 0.611, + "args": { + "External id": 446807,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007918810.037, "dur": 51.454, + "args": { + "External id": 446808,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918862.531, "dur": 5.922, + "args": { + "External id": 446809,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918863.345, "dur": 4.432, + "args": { + "External id": 446810,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918866.597, "dur": 0.978, + "args": { + "External id": 446811,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918870.233, "dur": 6.706, + "args": { + "External id": 446812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918871.350, "dur": 5.113, + "args": { + "External id": 446813,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918874.146, "dur": 2.176, + "args": { + "External id": 446814,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007918877.638, "dur": 47.306, + "args": { + "External id": 446815,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918938.182, "dur": 8.692, + "args": { + "External id": 446816,"Record function id": 0, "Sequence number": 5285564, "Fwd thread id": 1, "Ev Idx": 351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918939.053, "dur": 5.786, + "args": { + "External id": 446817,"Sequence number": 5285564, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 352 + } + }, + { + "ph": "f", "id": 36, "pid": 4183441, "tid": 31362, "ts": 676007918939.053, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918941.221, "dur": 3.477, + "args": { + "External id": 446818,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918943.306, "dur": 1.299, + "args": { + "External id": 446819,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918950.474, "dur": 8.352, + "args": { + "External id": 446820,"Record function id": 0, "Sequence number": 5285563, "Fwd thread id": 1, "Ev Idx": 355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918951.566, "dur": 4.419, + "args": { + "External id": 446821,"Sequence number": 5285563, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 356 + } + }, + { + "ph": "f", "id": 37, "pid": 4183441, "tid": 31362, "ts": 676007918951.566, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918952.529, "dur": 3.235, + "args": { + "External id": 446822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918953.551, "dur": 1.726, + "args": { + "External id": 446823,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918954.597, "dur": 0.528, + "args": { + "External id": 446824,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918964.097, "dur": 4.940, + "args": { + "External id": 446825,"Record function id": 0, "Ev Idx": 360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007918965.370, "dur": 3.106, + "args": { + "External id": 446826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007918966.545, "dur": 1.585, + "args": { + "External id": 446827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007918966.995, "dur": 1.055, + "args": { + "External id": 446828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918972.254, "dur": 8.933, + "args": { + "External id": 446829,"Record function id": 0, "Sequence number": 5285562, "Fwd thread id": 1, "Ev Idx": 364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918973.215, "dur": 4.360, + "args": { + "External id": 446830,"Sequence number": 5285562, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 365 + } + }, + { + "ph": "f", "id": 38, "pid": 4183441, "tid": 31362, "ts": 676007918973.215, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007918976.152, "dur": 1.302, + "args": { + "External id": 446831,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007918976.655, "dur": 0.673, + "args": { + "External id": 446832,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918984.196, "dur": 113.579, + "args": { + "External id": 446833,"Record function id": 0, "Sequence number": 5285561, "Fwd thread id": 1, "Ev Idx": 368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007918985.175, "dur": 88.034, + "args": { + "External id": 446834,"Sequence number": 5285561, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 369 + } + }, + { + "ph": "f", "id": 39, "pid": 4183441, "tid": 31362, "ts": 676007918985.175, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007918988.321, "dur": 4.399, + "args": { + "External id": 446835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007918989.116, "dur": 3.185, + "args": { + "External id": 446836,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007918991.608, "dur": 0.595, + "args": { + "External id": 446837,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007918993.376, "dur": 28.269, + "args": { + "External id": 446838,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919022.608, "dur": 5.820, + "args": { + "External id": 446839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919023.173, "dur": 4.672, + "args": { + "External id": 446840,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919025.441, "dur": 2.273, + "args": { + "External id": 446841,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919029.456, "dur": 4.793, + "args": { + "External id": 446842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919030.423, "dur": 3.364, + "args": { + "External id": 446843,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919033.038, "dur": 0.645, + "args": { + "External id": 446844,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007919034.827, "dur": 37.622, + "args": { + "External id": 446845,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919106.922, "dur": 43.222, + "args": { + "External id": 446846,"Record function id": 0, "Sequence number": 5285560, "Fwd thread id": 1, "Ev Idx": 381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919108.102, "dur": 5.774, + "args": { + "External id": 446847,"Sequence number": 5285560, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 382 + } + }, + { + "ph": "f", "id": 40, "pid": 4183441, "tid": 31362, "ts": 676007919108.102, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919109.703, "dur": 4.015, + "args": { + "External id": 446848,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919112.050, "dur": 1.576, + "args": { + "External id": 446849,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007919118.929, "dur": 28.269, + "args": { + "External id": 446850,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919153.947, "dur": 11.226, + "args": { + "External id": 446851,"Record function id": 0, "Sequence number": 5285559, "Fwd thread id": 1, "Ev Idx": 386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919155.223, "dur": 6.736, + "args": { + "External id": 446852,"Sequence number": 5285559, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 387 + } + }, + { + "ph": "f", "id": 41, "pid": 4183441, "tid": 31362, "ts": 676007919155.223, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919158.360, "dur": 3.401, + "args": { + "External id": 446853,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919159.384, "dur": 1.784, + "args": { + "External id": 446854,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919160.489, "dur": 0.578, + "args": { + "External id": 446855,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919169.324, "dur": 5.420, + "args": { + "External id": 446856,"Record function id": 0, "Ev Idx": 391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919170.573, "dur": 3.662, + "args": { + "External id": 446857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007919171.728, "dur": 2.078, + "args": { + "External id": 446858,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007919172.267, "dur": 1.462, + "args": { + "External id": 446859,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007919178.886, "dur": 463.720, + "args": { + "External id": 446860,"Record function id": 0, "Sequence number": 5285558, "Fwd thread id": 1, "Ev Idx": 395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007919180.271, "dur": 446.157, + "args": { + "External id": 446861,"Sequence number": 5285558, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 396 + } + }, + { + "ph": "f", "id": 42, "pid": 4183441, "tid": 31362, "ts": 676007919180.271, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 31362, + "ts": 676007919208.543, "dur": 36.077, + "args": { + "External id": 446862,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007919210.558, "dur": 33.844, + "args": { + "External id": 446863,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007919215.183, "dur": 5.759, + "args": { + "External id": 446864,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007919217.764, "dur": 2.698, + "args": { + "External id": 446865,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007919222.310, "dur": 21.626, + "args": { + "External id": 446866,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919259.170, "dur": 4.127, + "args": { + "External id": 446867,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919260.074, "dur": 3.127, + "args": { + "External id": 446868,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919267.323, "dur": 1.773, + "args": { + "External id": 446869,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919268.218, "dur": 0.782, + "args": { + "External id": 446870,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007919285.486, "dur": 2.386, + "args": { + "External id": 446871,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007919302.678, "dur": 3.177, + "args": { + "External id": 446872,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919513.605, "dur": 2.560, + "args": { + "External id": 446873,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007919520.891, "dur": 34.206, + "args": { + "External id": 446874,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919530.781, "dur": 0.908, + "args": { + "External id": 446875,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007919561.719, "dur": 31.580, + "args": { + "External id": 446876,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007919563.557, "dur": 29.505, + "args": { + "External id": 446877,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919567.825, "dur": 3.938, + "args": { + "External id": 446878,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007919574.794, "dur": 17.772, + "args": { + "External id": 446879,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007919597.792, "dur": 2.478, + "args": { + "External id": 446880,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919598.915, "dur": 1.224, + "args": { + "External id": 446881,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919605.836, "dur": 5.987, + "args": { + "External id": 446882,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919608.638, "dur": 2.988, + "args": { + "External id": 446883,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919613.680, "dur": 1.345, + "args": { + "External id": 446884,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919614.083, "dur": 0.855, + "args": { + "External id": 446885,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919691.443, "dur": 12.399, + "args": { + "External id": 446886,"Record function id": 0, "Ev Idx": 421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919694.898, "dur": 7.766, + "args": { + "External id": 446887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007919697.574, "dur": 3.591, + "args": { + "External id": 446888,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007919698.567, "dur": 2.352, + "args": { + "External id": 446889,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919708.674, "dur": 10.823, + "args": { + "External id": 446890,"Record function id": 0, "Sequence number": 5285557, "Fwd thread id": 1, "Ev Idx": 425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919709.962, "dur": 6.365, + "args": { + "External id": 446891,"Sequence number": 5285557, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 426 + } + }, + { + "ph": "f", "id": 43, "pid": 4183441, "tid": 31362, "ts": 676007919709.962, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919711.625, "dur": 4.489, + "args": { + "External id": 446892,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919714.160, "dur": 1.809, + "args": { + "External id": 446893,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919724.767, "dur": 152.314, + "args": { + "External id": 446894,"Record function id": 0, "Sequence number": 5285556, "Fwd thread id": 1, "Ev Idx": 429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919725.838, "dur": 145.100, + "args": { + "External id": 446895,"Sequence number": 5285556, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 430 + } + }, + { + "ph": "f", "id": 44, "pid": 4183441, "tid": 31362, "ts": 676007919725.838, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919729.829, "dur": 5.175, + "args": { + "External id": 446896,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919731.586, "dur": 2.724, + "args": { + "External id": 446897,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919732.999, "dur": 1.084, + "args": { + "External id": 446898,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007919736.327, "dur": 80.061, + "args": { + "External id": 446899,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919817.623, "dur": 7.236, + "args": { + "External id": 446900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919820.249, "dur": 3.906, + "args": { + "External id": 446901,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919821.477, "dur": 2.512, + "args": { + "External id": 446902,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919826.615, "dur": 5.797, + "args": { + "External id": 446903,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919828.130, "dur": 3.798, + "args": { + "External id": 446904,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919831.150, "dur": 0.687, + "args": { + "External id": 446905,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007919833.151, "dur": 37.002, + "args": { + "External id": 446906,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919881.940, "dur": 12.671, + "args": { + "External id": 446907,"Record function id": 0, "Sequence number": 5285555, "Fwd thread id": 1, "Ev Idx": 442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919883.500, "dur": 7.980, + "args": { + "External id": 446908,"Sequence number": 5285555, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 443 + } + }, + { + "ph": "f", "id": 45, "pid": 4183441, "tid": 31362, "ts": 676007919883.500, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919887.415, "dur": 3.920, + "args": { + "External id": 446909,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919888.235, "dur": 2.987, + "args": { + "External id": 446910,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919898.270, "dur": 7.789, + "args": { + "External id": 446911,"Record function id": 0, "Sequence number": 5285554, "Fwd thread id": 1, "Ev Idx": 446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919899.208, "dur": 4.040, + "args": { + "External id": 446912,"Sequence number": 5285554, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 447 + } + }, + { + "ph": "f", "id": 46, "pid": 4183441, "tid": 31362, "ts": 676007919899.208, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007919900.520, "dur": 2.494, + "args": { + "External id": 446913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007919901.137, "dur": 1.421, + "args": { + "External id": 446914,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919902.048, "dur": 0.406, + "args": { + "External id": 446915,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919912.055, "dur": 7.168, + "args": { + "External id": 446916,"Record function id": 0, "Ev Idx": 451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007919913.518, "dur": 5.214, + "args": { + "External id": 446917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007919914.791, "dur": 3.632, + "args": { + "External id": 446918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007919917.052, "dur": 1.264, + "args": { + "External id": 446919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919922.254, "dur": 7.403, + "args": { + "External id": 446920,"Record function id": 0, "Sequence number": 5285553, "Fwd thread id": 1, "Ev Idx": 455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007919923.221, "dur": 3.596, + "args": { + "External id": 446921,"Sequence number": 5285553, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 456 + } + }, + { + "ph": "f", "id": 47, "pid": 4183441, "tid": 31362, "ts": 676007919923.221, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007919924.679, "dur": 1.997, + "args": { + "External id": 446922,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007919925.276, "dur": 1.257, + "args": { + "External id": 446923,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007919934.238, "dur": 350.744, + "args": { + "External id": 446924,"Record function id": 0, "Sequence number": 5285552, "Fwd thread id": 1, "Ev Idx": 459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007919935.458, "dur": 326.351, + "args": { + "External id": 446925,"Sequence number": 5285552, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 460 + } + }, + { + "ph": "f", "id": 48, "pid": 4183441, "tid": 31362, "ts": 676007919935.458, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007919956.306, "dur": 10.909, + "args": { + "External id": 446926,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919962.922, "dur": 3.789, + "args": { + "External id": 446927,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007919969.658, "dur": 3.087, + "args": { + "External id": 446928,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919970.507, "dur": 2.018, + "args": { + "External id": 446929,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007919974.416, "dur": 5.662, + "args": { + "External id": 446930,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007919977.029, "dur": 2.824, + "args": { + "External id": 446931,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007920011.540, "dur": 223.154, + "args": { + "External id": 446932,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007920133.571, "dur": 4.750, + "args": { + "External id": 446933,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007920140.070, "dur": 3.867, + "args": { + "External id": 446934,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007920248.711, "dur": 4.062, + "args": { + "External id": 446935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007920255.743, "dur": 0.688, + "args": { + "External id": 446936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007920258.347, "dur": 0.607, + "args": { + "External id": 446937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007920294.502, "dur": 238.283, + "args": { + "External id": 446938,"Record function id": 0, "Sequence number": 5285551, "Fwd thread id": 1, "Ev Idx": 473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007920296.149, "dur": 228.594, + "args": { + "External id": 446939,"Sequence number": 5285551, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 474 + } + }, + { + "ph": "f", "id": 49, "pid": 4183441, "tid": 31362, "ts": 676007920296.149, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007920322.047, "dur": 41.315, + "args": { + "External id": 446940,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920326.590, "dur": 2.822, + "args": { + "External id": 446941,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007920331.034, "dur": 31.724, + "args": { + "External id": 446942,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007920375.284, "dur": 3.508, + "args": { + "External id": 446943,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920376.555, "dur": 1.902, + "args": { + "External id": 446944,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007920539.654, "dur": 192.794, + "args": { + "External id": 446945,"Record function id": 0, "Sequence number": 5285550, "Fwd thread id": 1, "Ev Idx": 480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007920541.134, "dur": 183.267, + "args": { + "External id": 446946,"Sequence number": 5285550, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 481 + } + }, + { + "ph": "f", "id": 50, "pid": 4183441, "tid": 31362, "ts": 676007920541.134, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007920553.458, "dur": 28.452, + "args": { + "External id": 446947,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920555.460, "dur": 2.487, + "args": { + "External id": 446948,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007920559.051, "dur": 22.278, + "args": { + "External id": 446949,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007920590.853, "dur": 5.118, + "args": { + "External id": 446950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920591.980, "dur": 3.708, + "args": { + "External id": 446951,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920741.328, "dur": 14.847, + "args": { + "External id": 446952,"Record function id": 0, "Sequence number": 5285549, "Fwd thread id": 1, "Ev Idx": 487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920742.897, "dur": 10.351, + "args": { + "External id": 446953,"Sequence number": 5285549, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 488 + } + }, + { + "ph": "f", "id": 51, "pid": 4183441, "tid": 31362, "ts": 676007920742.897, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007920745.423, "dur": 7.545, + "args": { + "External id": 446954,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007920746.693, "dur": 6.053, + "args": { + "External id": 446955,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920759.639, "dur": 7.760, + "args": { + "External id": 446956,"Record function id": 0, "Sequence number": 5285548, "Fwd thread id": 1, "Ev Idx": 491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920760.516, "dur": 4.765, + "args": { + "External id": 446957,"Sequence number": 5285548, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 492 + } + }, + { + "ph": "f", "id": 52, "pid": 4183441, "tid": 31362, "ts": 676007920760.516, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007920763.528, "dur": 1.607, + "args": { + "External id": 446958,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007920764.116, "dur": 0.876, + "args": { + "External id": 446959,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920770.388, "dur": 7.296, + "args": { + "External id": 446960,"Record function id": 0, "Sequence number": 5285547, "Fwd thread id": 1, "Ev Idx": 495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920772.799, "dur": 2.904, + "args": { + "External id": 446961,"Sequence number": 5285547, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 496 + } + }, + { + "ph": "f", "id": 53, "pid": 4183441, "tid": 31362, "ts": 676007920772.799, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007920774.046, "dur": 1.509, + "args": { + "External id": 446962,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007920774.674, "dur": 0.749, + "args": { + "External id": 446963,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920780.966, "dur": 8.193, + "args": { + "External id": 446964,"Record function id": 0, "Sequence number": 5285546, "Fwd thread id": 1, "Ev Idx": 499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920784.087, "dur": 2.946, + "args": { + "External id": 446965,"Sequence number": 5285546, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 500 + } + }, + { + "ph": "f", "id": 54, "pid": 4183441, "tid": 31362, "ts": 676007920784.087, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007920785.427, "dur": 1.469, + "args": { + "External id": 446966,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007920785.913, "dur": 0.883, + "args": { + "External id": 446967,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920792.398, "dur": 182.279, + "args": { + "External id": 446968,"Record function id": 0, "Sequence number": 5285545, "Fwd thread id": 1, "Ev Idx": 503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920793.366, "dur": 173.384, + "args": { + "External id": 446969,"Sequence number": 5285545, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 504 + } + }, + { + "ph": "f", "id": 55, "pid": 4183441, "tid": 31362, "ts": 676007920793.366, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007920800.519, "dur": 6.739, + "args": { + "External id": 446970,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007920802.810, "dur": 3.781, + "args": { + "External id": 446971,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920804.839, "dur": 1.460, + "args": { + "External id": 446972,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007920808.774, "dur": 82.017, + "args": { + "External id": 446973,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007920892.204, "dur": 6.244, + "args": { + "External id": 446974,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007920893.100, "dur": 4.715, + "args": { + "External id": 446975,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920896.215, "dur": 1.430, + "args": { + "External id": 446976,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007920917.265, "dur": 4.233, + "args": { + "External id": 446977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007920918.314, "dur": 2.733, + "args": { + "External id": 446978,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920920.532, "dur": 0.414, + "args": { + "External id": 446979,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007920922.084, "dur": 43.625, + "args": { + "External id": 446980,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920979.612, "dur": 6.937, + "args": { + "External id": 446981,"Record function id": 0, "Sequence number": 5285544, "Fwd thread id": 1, "Ev Idx": 516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920980.544, "dur": 3.331, + "args": { + "External id": 446982,"Sequence number": 5285544, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 517 + } + }, + { + "ph": "f", "id": 56, "pid": 4183441, "tid": 31362, "ts": 676007920980.544, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007920981.908, "dur": 1.820, + "args": { + "External id": 446983,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007920982.409, "dur": 1.220, + "args": { + "External id": 446984,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920989.679, "dur": 9.875, + "args": { + "External id": 446985,"Record function id": 0, "Sequence number": 5285543, "Fwd thread id": 1, "Ev Idx": 520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007920992.870, "dur": 4.768, + "args": { + "External id": 446986,"Sequence number": 5285543, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 521 + } + }, + { + "ph": "f", "id": 57, "pid": 4183441, "tid": 31362, "ts": 676007920992.870, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007920993.791, "dur": 3.637, + "args": { + "External id": 446987,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007920994.381, "dur": 2.557, + "args": { + "External id": 446988,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007920996.334, "dur": 0.461, + "args": { + "External id": 446989,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921004.791, "dur": 8.494, + "args": { + "External id": 446990,"Record function id": 0, "Ev Idx": 525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921006.268, "dur": 6.357, + "args": { + "External id": 446991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007921008.748, "dur": 3.476, + "args": { + "External id": 446992,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007921009.825, "dur": 2.305, + "args": { + "External id": 446993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921018.397, "dur": 7.976, + "args": { + "External id": 446994,"Record function id": 0, "Sequence number": 5285542, "Fwd thread id": 1, "Ev Idx": 529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921019.255, "dur": 4.411, + "args": { + "External id": 446995,"Sequence number": 5285542, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 530 + } + }, + { + "ph": "f", "id": 58, "pid": 4183441, "tid": 31362, "ts": 676007921019.255, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921020.545, "dur": 2.963, + "args": { + "External id": 446996,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921022.596, "dur": 0.790, + "args": { + "External id": 446997,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921029.800, "dur": 122.259, + "args": { + "External id": 446998,"Record function id": 0, "Sequence number": 5285541, "Fwd thread id": 1, "Ev Idx": 533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921030.664, "dur": 113.966, + "args": { + "External id": 446999,"Sequence number": 5285541, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 534 + } + }, + { + "ph": "f", "id": 59, "pid": 4183441, "tid": 31362, "ts": 676007921030.664, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921034.499, "dur": 3.258, + "args": { + "External id": 447000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921034.945, "dur": 2.375, + "args": { + "External id": 447001,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921036.893, "dur": 0.320, + "args": { + "External id": 447002,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007921040.579, "dur": 34.815, + "args": { + "External id": 447003,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921076.372, "dur": 2.727, + "args": { + "External id": 447004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921077.017, "dur": 1.517, + "args": { + "External id": 447005,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921077.774, "dur": 0.647, + "args": { + "External id": 447006,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921080.483, "dur": 23.699, + "args": { + "External id": 447007,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921099.021, "dur": 4.133, + "args": { + "External id": 447008,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921100.719, "dur": 2.030, + "args": { + "External id": 447009,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007921106.754, "dur": 36.917, + "args": { + "External id": 447010,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921157.773, "dur": 32.884, + "args": { + "External id": 447011,"Record function id": 0, "Sequence number": 5285540, "Fwd thread id": 1, "Ev Idx": 546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921158.672, "dur": 5.275, + "args": { + "External id": 447012,"Sequence number": 5285540, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 547 + } + }, + { + "ph": "f", "id": 60, "pid": 4183441, "tid": 31362, "ts": 676007921158.672, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921161.558, "dur": 2.244, + "args": { + "External id": 447013,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921162.371, "dur": 1.323, + "args": { + "External id": 447014,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007921167.234, "dur": 21.163, + "args": { + "External id": 447015,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921194.378, "dur": 9.138, + "args": { + "External id": 447016,"Record function id": 0, "Sequence number": 5285539, "Fwd thread id": 1, "Ev Idx": 551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921195.460, "dur": 6.258, + "args": { + "External id": 447017,"Sequence number": 5285539, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 552 + } + }, + { + "ph": "f", "id": 61, "pid": 4183441, "tid": 31362, "ts": 676007921195.460, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921196.320, "dur": 5.185, + "args": { + "External id": 447018,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921199.209, "dur": 1.785, + "args": { + "External id": 447019,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921200.180, "dur": 0.691, + "args": { + "External id": 447020,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921207.430, "dur": 5.312, + "args": { + "External id": 447021,"Record function id": 0, "Ev Idx": 556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921208.647, "dur": 3.486, + "args": { + "External id": 447022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007921209.824, "dur": 1.816, + "args": { + "External id": 447023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007921210.325, "dur": 1.226, + "args": { + "External id": 447024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921215.995, "dur": 8.488, + "args": { + "External id": 447025,"Record function id": 0, "Sequence number": 5285538, "Fwd thread id": 1, "Ev Idx": 560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921218.103, "dur": 3.120, + "args": { + "External id": 447026,"Sequence number": 5285538, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 561 + } + }, + { + "ph": "f", "id": 62, "pid": 4183441, "tid": 31362, "ts": 676007921218.103, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921219.456, "dur": 1.614, + "args": { + "External id": 447027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921220.055, "dur": 0.909, + "args": { + "External id": 447028,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921229.060, "dur": 92.702, + "args": { + "External id": 447029,"Record function id": 0, "Sequence number": 5285537, "Fwd thread id": 1, "Ev Idx": 564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921229.930, "dur": 83.265, + "args": { + "External id": 447030,"Sequence number": 5285537, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 565 + } + }, + { + "ph": "f", "id": 63, "pid": 4183441, "tid": 31362, "ts": 676007921229.930, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921232.581, "dur": 2.414, + "args": { + "External id": 447031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921233.175, "dur": 1.396, + "args": { + "External id": 447032,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921234.000, "dur": 0.456, + "args": { + "External id": 447033,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007921235.604, "dur": 35.626, + "args": { + "External id": 447034,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921272.472, "dur": 4.413, + "args": { + "External id": 447035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921274.895, "dur": 1.440, + "args": { + "External id": 447036,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921275.818, "dur": 0.408, + "args": { + "External id": 447037,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921278.274, "dur": 3.656, + "args": { + "External id": 447038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921278.958, "dur": 2.521, + "args": { + "External id": 447039,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921281.139, "dur": 0.269, + "args": { + "External id": 447040,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007921282.332, "dur": 30.145, + "args": { + "External id": 447041,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921326.108, "dur": 26.630, + "args": { + "External id": 447042,"Record function id": 0, "Sequence number": 5285536, "Fwd thread id": 1, "Ev Idx": 577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921328.719, "dur": 3.578, + "args": { + "External id": 447043,"Sequence number": 5285536, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 578 + } + }, + { + "ph": "f", "id": 64, "pid": 4183441, "tid": 31362, "ts": 676007921328.719, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921330.357, "dur": 1.774, + "args": { + "External id": 447044,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921331.016, "dur": 0.994, + "args": { + "External id": 447045,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007921334.540, "dur": 15.811, + "args": { + "External id": 447046,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921356.170, "dur": 11.831, + "args": { + "External id": 447047,"Record function id": 0, "Sequence number": 5285535, "Fwd thread id": 1, "Ev Idx": 582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921357.219, "dur": 7.705, + "args": { + "External id": 447048,"Sequence number": 5285535, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 583 + } + }, + { + "ph": "f", "id": 65, "pid": 4183441, "tid": 31362, "ts": 676007921357.219, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921358.238, "dur": 6.437, + "args": { + "External id": 447049,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921360.214, "dur": 3.956, + "args": { + "External id": 447050,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921363.587, "dur": 0.433, + "args": { + "External id": 447051,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921371.706, "dur": 4.424, + "args": { + "External id": 447052,"Record function id": 0, "Ev Idx": 587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921372.856, "dur": 2.783, + "args": { + "External id": 447053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007921373.651, "dur": 1.648, + "args": { + "External id": 447054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007921373.987, "dur": 1.209, + "args": { + "External id": 447055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007921380.278, "dur": 408.533, + "args": { + "External id": 447056,"Record function id": 0, "Sequence number": 5285534, "Fwd thread id": 1, "Ev Idx": 591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007921381.372, "dur": 369.705, + "args": { + "External id": 447057,"Sequence number": 5285534, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 592 + } + }, + { + "ph": "f", "id": 66, "pid": 4183441, "tid": 31362, "ts": 676007921381.372, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921414.935, "dur": 1.594, + "args": { + "External id": 447058,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921415.366, "dur": 1.031, + "args": { + "External id": 447059,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007921431.056, "dur": 5.532, + "args": { + "External id": 447060,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007921448.238, "dur": 4.446, + "args": { + "External id": 447061,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921605.882, "dur": 1.873, + "args": { + "External id": 447062,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007921611.815, "dur": 35.497, + "args": { + "External id": 447063,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921622.191, "dur": 0.752, + "args": { + "External id": 447064,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007921653.010, "dur": 70.306, + "args": { + "External id": 447065,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007921691.553, "dur": 31.499, + "args": { + "External id": 447066,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921696.048, "dur": 5.285, + "args": { + "External id": 447067,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007921703.007, "dur": 19.502, + "args": { + "External id": 447068,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007921728.705, "dur": 4.845, + "args": { + "External id": 447069,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921731.805, "dur": 1.642, + "args": { + "External id": 447070,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921740.518, "dur": 3.322, + "args": { + "External id": 447071,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921742.492, "dur": 1.215, + "args": { + "External id": 447072,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007921763.904, "dur": 18.767, + "args": { + "External id": 447073,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921801.084, "dur": 8.564, + "args": { + "External id": 447074,"Record function id": 0, "Ev Idx": 609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007921802.864, "dur": 6.089, + "args": { + "External id": 447075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007921804.745, "dur": 3.016, + "args": { + "External id": 447076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007921805.858, "dur": 1.803, + "args": { + "External id": 447077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921815.674, "dur": 7.262, + "args": { + "External id": 447078,"Record function id": 0, "Sequence number": 5285533, "Fwd thread id": 1, "Ev Idx": 613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007921816.831, "dur": 1.671, + "args": { + "External id": 447079,"Sequence number": 5285533, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 614 + } + }, + { + "ph": "f", "id": 67, "pid": 4183441, "tid": 31362, "ts": 676007921816.831, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007921826.806, "dur": 419.832, + "args": { + "External id": 447080,"Record function id": 0, "Sequence number": 5285532, "Fwd thread id": 1, "Ev Idx": 615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007921827.714, "dur": 404.878, + "args": { + "External id": 447081,"Sequence number": 5285532, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 616 + } + }, + { + "ph": "f", "id": 68, "pid": 4183441, "tid": 31362, "ts": 676007921827.714, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007921859.824, "dur": 7.974, + "args": { + "External id": 447082,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007921864.622, "dur": 2.900, + "args": { + "External id": 447083,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921871.816, "dur": 8.526, + "args": { + "External id": 447084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921873.428, "dur": 6.276, + "args": { + "External id": 447085,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921877.013, "dur": 2.537, + "args": { + "External id": 447086,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 31362, + "ts": 676007921885.681, "dur": 83.900, + "args": { + "External id": 447087,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007921886.408, "dur": 2.104, + "args": { + "External id": 447088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007921886.854, "dur": 1.249, + "args": { + "External id": 447089,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007921887.470, "dur": 0.547, + "args": { + "External id": 447090,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 31362, + "ts": 676007921889.735, "dur": 79.397, + "args": { + "External id": 447091,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007921891.170, "dur": 77.337, + "args": { + "External id": 447092,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007921973.074, "dur": 4.529, + "args": { + "External id": 447093,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007921976.058, "dur": 1.410, + "args": { + "External id": 447094,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922009.296, "dur": 4.869, + "args": { + "External id": 447095,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922015.141, "dur": 1.875, + "args": { + "External id": 447096,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922017.756, "dur": 1.984, + "args": { + "External id": 447097,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922053.282, "dur": 2.007, + "args": { + "External id": 447098,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922053.874, "dur": 1.240, + "args": { + "External id": 447099,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183441, "tid": 31362, + "ts": 676007922076.818, "dur": 134.961, + "args": { + "External id": 447100,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007922097.087, "dur": 8.864, + "args": { + "External id": 447101,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922102.016, "dur": 2.838, + "args": { + "External id": 447102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007922107.293, "dur": 6.568, + "args": { + "External id": 447103,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922112.602, "dur": 0.442, + "args": { + "External id": 447104,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007922115.360, "dur": 2.610, + "args": { + "External id": 447105,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922117.067, "dur": 0.555, + "args": { + "External id": 447106,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007922118.424, "dur": 2.053, + "args": { + "External id": 447107,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922119.306, "dur": 0.505, + "args": { + "External id": 447108,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007922125.477, "dur": 1.655, + "args": { + "External id": 447109,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922126.435, "dur": 0.414, + "args": { + "External id": 447110,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922131.080, "dur": 4.835, + "args": { + "External id": 447111,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007922133.848, "dur": 1.908, + "args": { + "External id": 447112,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007922136.544, "dur": 2.156, + "args": { + "External id": 447113,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922138.129, "dur": 0.298, + "args": { + "External id": 447114,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922139.820, "dur": 4.199, + "args": { + "External id": 447115,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922140.757, "dur": 3.160, + "args": { + "External id": 447116,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007922145.520, "dur": 54.183, + "args": { + "External id": 447117,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922201.601, "dur": 1.215, + "args": { + "External id": 447118,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007922204.058, "dur": 3.355, + "args": { + "External id": 447119,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922206.079, "dur": 0.480, + "args": { + "External id": 447120,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922209.752, "dur": 0.914, + "args": { + "External id": 447121,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922257.461, "dur": 8.221, + "args": { + "External id": 447122,"Record function id": 0, "Ev Idx": 657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922259.496, "dur": 5.609, + "args": { + "External id": 447123,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007922261.478, "dur": 2.874, + "args": { + "External id": 447124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007922262.294, "dur": 1.952, + "args": { + "External id": 447125,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922269.209, "dur": 8.265, + "args": { + "External id": 447126,"Record function id": 0, "Sequence number": 5285531, "Fwd thread id": 1, "Ev Idx": 661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922270.504, "dur": 3.901, + "args": { + "External id": 447127,"Sequence number": 5285531, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 662 + } + }, + { + "ph": "f", "id": 69, "pid": 4183441, "tid": 31362, "ts": 676007922270.504, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922272.452, "dur": 1.731, + "args": { + "External id": 447128,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922273.336, "dur": 0.708, + "args": { + "External id": 447129,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922280.921, "dur": 107.655, + "args": { + "External id": 447130,"Record function id": 0, "Sequence number": 5285530, "Fwd thread id": 1, "Ev Idx": 665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922281.869, "dur": 99.658, + "args": { + "External id": 447131,"Sequence number": 5285530, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 666 + } + }, + { + "ph": "f", "id": 70, "pid": 4183441, "tid": 31362, "ts": 676007922281.869, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922287.694, "dur": 4.066, + "args": { + "External id": 447132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922288.725, "dur": 2.494, + "args": { + "External id": 447133,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922290.610, "dur": 0.472, + "args": { + "External id": 447134,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007922292.730, "dur": 35.314, + "args": { + "External id": 447135,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922329.310, "dur": 6.814, + "args": { + "External id": 447136,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922330.140, "dur": 5.053, + "args": { + "External id": 447137,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922334.051, "dur": 0.973, + "args": { + "External id": 447138,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922337.720, "dur": 5.181, + "args": { + "External id": 447139,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922338.368, "dur": 3.943, + "args": { + "External id": 447140,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922339.812, "dur": 2.432, + "args": { + "External id": 447141,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007922343.526, "dur": 37.316, + "args": { + "External id": 447142,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922393.078, "dur": 6.468, + "args": { + "External id": 447143,"Record function id": 0, "Sequence number": 5285529, "Fwd thread id": 1, "Ev Idx": 678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922394.009, "dur": 4.245, + "args": { + "External id": 447144,"Sequence number": 5285529, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 679 + } + }, + { + "ph": "f", "id": 71, "pid": 4183441, "tid": 31362, "ts": 676007922394.009, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922395.816, "dur": 2.285, + "args": { + "External id": 447145,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922396.898, "dur": 1.096, + "args": { + "External id": 447146,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922402.873, "dur": 9.416, + "args": { + "External id": 447147,"Record function id": 0, "Sequence number": 5285528, "Fwd thread id": 1, "Ev Idx": 682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922405.200, "dur": 4.467, + "args": { + "External id": 447148,"Sequence number": 5285528, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 683 + } + }, + { + "ph": "f", "id": 72, "pid": 4183441, "tid": 31362, "ts": 676007922405.200, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922406.017, "dur": 3.423, + "args": { + "External id": 447149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922406.574, "dur": 2.303, + "args": { + "External id": 447150,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922408.373, "dur": 0.365, + "args": { + "External id": 447151,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922416.210, "dur": 5.145, + "args": { + "External id": 447152,"Record function id": 0, "Ev Idx": 687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922417.926, "dur": 2.940, + "args": { + "External id": 447153,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007922418.860, "dur": 1.638, + "args": { + "External id": 447154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007922419.278, "dur": 1.142, + "args": { + "External id": 447155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922424.573, "dur": 9.145, + "args": { + "External id": 447156,"Record function id": 0, "Sequence number": 5285527, "Fwd thread id": 1, "Ev Idx": 691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922426.042, "dur": 5.224, + "args": { + "External id": 447157,"Sequence number": 5285527, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 692 + } + }, + { + "ph": "f", "id": 73, "pid": 4183441, "tid": 31362, "ts": 676007922426.042, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922427.832, "dur": 3.287, + "args": { + "External id": 447158,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922430.372, "dur": 0.614, + "args": { + "External id": 447159,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922436.604, "dur": 94.964, + "args": { + "External id": 447160,"Record function id": 0, "Sequence number": 5285526, "Fwd thread id": 1, "Ev Idx": 695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922437.653, "dur": 84.780, + "args": { + "External id": 447161,"Sequence number": 5285526, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 696 + } + }, + { + "ph": "f", "id": 74, "pid": 4183441, "tid": 31362, "ts": 676007922437.653, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922440.276, "dur": 4.979, + "args": { + "External id": 447162,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922440.987, "dur": 3.831, + "args": { + "External id": 447163,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922444.070, "dur": 0.637, + "args": { + "External id": 447164,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007922447.829, "dur": 27.718, + "args": { + "External id": 447165,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922476.495, "dur": 6.418, + "args": { + "External id": 447166,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922477.136, "dur": 5.251, + "args": { + "External id": 447167,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922478.533, "dur": 3.709, + "args": { + "External id": 447168,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922484.222, "dur": 4.563, + "args": { + "External id": 447169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922484.862, "dur": 3.477, + "args": { + "External id": 447170,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922487.701, "dur": 0.527, + "args": { + "External id": 447171,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007922489.395, "dur": 32.246, + "args": { + "External id": 447172,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922535.699, "dur": 30.845, + "args": { + "External id": 447173,"Record function id": 0, "Sequence number": 5285525, "Fwd thread id": 1, "Ev Idx": 708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922536.521, "dur": 4.273, + "args": { + "External id": 447174,"Sequence number": 5285525, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 709 + } + }, + { + "ph": "f", "id": 75, "pid": 4183441, "tid": 31362, "ts": 676007922536.521, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922538.448, "dur": 2.179, + "args": { + "External id": 447175,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922539.401, "dur": 1.126, + "args": { + "External id": 447176,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007922543.487, "dur": 20.384, + "args": { + "External id": 447177,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922570.150, "dur": 10.375, + "args": { + "External id": 447178,"Record function id": 0, "Sequence number": 5285524, "Fwd thread id": 1, "Ev Idx": 713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007922571.194, "dur": 6.338, + "args": { + "External id": 447179,"Sequence number": 5285524, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 714 + } + }, + { + "ph": "f", "id": 76, "pid": 4183441, "tid": 31362, "ts": 676007922571.194, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007922571.993, "dur": 5.331, + "args": { + "External id": 447180,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007922572.888, "dur": 3.950, + "args": { + "External id": 447181,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922576.170, "dur": 0.558, + "args": { + "External id": 447182,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922584.437, "dur": 4.879, + "args": { + "External id": 447183,"Record function id": 0, "Ev Idx": 718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007922586.210, "dur": 2.691, + "args": { + "External id": 447184,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007922587.186, "dur": 1.467, + "args": { + "External id": 447185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007922587.616, "dur": 0.962, + "args": { + "External id": 447186,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007922596.016, "dur": 458.319, + "args": { + "External id": 447187,"Record function id": 0, "Sequence number": 5285523, "Fwd thread id": 1, "Ev Idx": 722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007922597.618, "dur": 421.218, + "args": { + "External id": 447188,"Sequence number": 5285523, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 723 + } + }, + { + "ph": "f", "id": 77, "pid": 4183441, "tid": 31362, "ts": 676007922597.618, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 31362, + "ts": 676007922618.905, "dur": 33.968, + "args": { + "External id": 447189,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007922620.310, "dur": 32.333, + "args": { + "External id": 447190,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007922623.216, "dur": 6.095, + "args": { + "External id": 447191,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922626.016, "dur": 2.850, + "args": { + "External id": 447192,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007922630.456, "dur": 21.499, + "args": { + "External id": 447193,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922701.956, "dur": 7.040, + "args": { + "External id": 447194,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922704.897, "dur": 3.849, + "args": { + "External id": 447195,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007922713.273, "dur": 1.818, + "args": { + "External id": 447196,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922714.178, "dur": 0.830, + "args": { + "External id": 447197,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922726.488, "dur": 3.443, + "args": { + "External id": 447198,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007922740.888, "dur": 2.573, + "args": { + "External id": 447199,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922912.417, "dur": 2.829, + "args": { + "External id": 447200,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007922919.316, "dur": 33.211, + "args": { + "External id": 447201,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922928.090, "dur": 0.771, + "args": { + "External id": 447202,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007922958.285, "dur": 28.209, + "args": { + "External id": 447203,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007922960.139, "dur": 26.130, + "args": { + "External id": 447204,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007922964.184, "dur": 4.097, + "args": { + "External id": 447205,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007922969.638, "dur": 16.129, + "args": { + "External id": 447206,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007922990.726, "dur": 4.379, + "args": { + "External id": 447207,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007922994.050, "dur": 0.903, + "args": { + "External id": 447208,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007923001.293, "dur": 4.549, + "args": { + "External id": 447209,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007923002.312, "dur": 3.434, + "args": { + "External id": 447210,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007923008.155, "dur": 1.918, + "args": { + "External id": 447211,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007923008.933, "dur": 1.056, + "args": { + "External id": 447212,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007923035.486, "dur": 17.335, + "args": { + "External id": 447213,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007923067.083, "dur": 10.544, + "args": { + "External id": 447214,"Record function id": 0, "Ev Idx": 749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007923069.493, "dur": 7.475, + "args": { + "External id": 447215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007923071.192, "dur": 4.947, + "args": { + "External id": 447216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007923074.135, "dur": 1.896, + "args": { + "External id": 447217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923097.934, "dur": 12.086, + "args": { + "External id": 447218,"Record function id": 0, "Sequence number": 5285522, "Fwd thread id": 1, "Ev Idx": 753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923100.128, "dur": 5.611, + "args": { + "External id": 447219,"Sequence number": 5285522, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 754 + } + }, + { + "ph": "f", "id": 78, "pid": 4183441, "tid": 31362, "ts": 676007923100.128, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007923102.228, "dur": 3.266, + "args": { + "External id": 447220,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007923103.253, "dur": 1.969, + "args": { + "External id": 447221,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923114.929, "dur": 139.883, + "args": { + "External id": 447222,"Record function id": 0, "Sequence number": 5285521, "Fwd thread id": 1, "Ev Idx": 757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923115.813, "dur": 131.918, + "args": { + "External id": 447223,"Sequence number": 5285521, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 758 + } + }, + { + "ph": "f", "id": 79, "pid": 4183441, "tid": 31362, "ts": 676007923115.813, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007923120.086, "dur": 7.265, + "args": { + "External id": 447224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007923123.617, "dur": 3.004, + "args": { + "External id": 447225,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923125.601, "dur": 0.845, + "args": { + "External id": 447226,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007923128.430, "dur": 69.847, + "args": { + "External id": 447227,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007923199.445, "dur": 5.427, + "args": { + "External id": 447228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007923200.152, "dur": 4.036, + "args": { + "External id": 447229,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923201.733, "dur": 2.325, + "args": { + "External id": 447230,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007923208.654, "dur": 3.557, + "args": { + "External id": 447231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007923209.487, "dur": 2.235, + "args": { + "External id": 447232,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923211.174, "dur": 0.482, + "args": { + "External id": 447233,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007923212.654, "dur": 34.343, + "args": { + "External id": 447234,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923259.648, "dur": 9.795, + "args": { + "External id": 447235,"Record function id": 0, "Sequence number": 5285520, "Fwd thread id": 1, "Ev Idx": 770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923260.537, "dur": 6.467, + "args": { + "External id": 447236,"Sequence number": 5285520, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 771 + } + }, + { + "ph": "f", "id": 80, "pid": 4183441, "tid": 31362, "ts": 676007923260.537, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007923262.604, "dur": 4.252, + "args": { + "External id": 447237,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007923263.583, "dur": 3.137, + "args": { + "External id": 447238,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923272.804, "dur": 9.462, + "args": { + "External id": 447239,"Record function id": 0, "Sequence number": 5285519, "Fwd thread id": 1, "Ev Idx": 774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923275.569, "dur": 4.031, + "args": { + "External id": 447240,"Sequence number": 5285519, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 775 + } + }, + { + "ph": "f", "id": 81, "pid": 4183441, "tid": 31362, "ts": 676007923275.569, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007923276.362, "dur": 3.027, + "args": { + "External id": 447241,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007923276.845, "dur": 2.015, + "args": { + "External id": 447242,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923278.176, "dur": 0.571, + "args": { + "External id": 447243,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007923286.253, "dur": 5.917, + "args": { + "External id": 447244,"Record function id": 0, "Ev Idx": 779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007923287.978, "dur": 3.668, + "args": { + "External id": 447245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007923289.231, "dur": 2.069, + "args": { + "External id": 447246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007923289.832, "dur": 1.382, + "args": { + "External id": 447247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923295.129, "dur": 8.953, + "args": { + "External id": 447248,"Record function id": 0, "Sequence number": 5285518, "Fwd thread id": 1, "Ev Idx": 783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007923296.147, "dur": 5.373, + "args": { + "External id": 447249,"Sequence number": 5285518, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 784 + } + }, + { + "ph": "f", "id": 82, "pid": 4183441, "tid": 31362, "ts": 676007923296.147, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007923299.182, "dur": 2.180, + "args": { + "External id": 447250,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007923300.055, "dur": 1.169, + "args": { + "External id": 447251,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923308.552, "dur": 280.068, + "args": { + "External id": 447252,"Record function id": 0, "Sequence number": 5285517, "Fwd thread id": 1, "Ev Idx": 787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923310.172, "dur": 256.236, + "args": { + "External id": 447253,"Sequence number": 5285517, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 788 + } + }, + { + "ph": "f", "id": 83, "pid": 4183441, "tid": 31362, "ts": 676007923310.172, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007923328.247, "dur": 6.593, + "args": { + "External id": 447254,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923330.873, "dur": 3.554, + "args": { + "External id": 447255,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007923336.956, "dur": 3.800, + "args": { + "External id": 447256,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923338.597, "dur": 1.965, + "args": { + "External id": 447257,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007923342.197, "dur": 4.689, + "args": { + "External id": 447258,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923344.088, "dur": 2.605, + "args": { + "External id": 447259,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007923372.135, "dur": 170.000, + "args": { + "External id": 447260,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007923449.093, "dur": 3.334, + "args": { + "External id": 447261,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007923454.193, "dur": 3.730, + "args": { + "External id": 447262,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007923554.641, "dur": 3.086, + "args": { + "External id": 447263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007923560.410, "dur": 0.684, + "args": { + "External id": 447264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007923563.160, "dur": 0.791, + "args": { + "External id": 447265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923595.511, "dur": 266.334, + "args": { + "External id": 447266,"Record function id": 0, "Sequence number": 5285516, "Fwd thread id": 1, "Ev Idx": 801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923597.405, "dur": 254.989, + "args": { + "External id": 447267,"Sequence number": 5285516, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 802 + } + }, + { + "ph": "f", "id": 84, "pid": 4183441, "tid": 31362, "ts": 676007923597.405, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007923617.564, "dur": 81.632, + "args": { + "External id": 447268,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923620.757, "dur": 2.718, + "args": { + "External id": 447269,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007923624.638, "dur": 73.481, + "args": { + "External id": 447270,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007923710.842, "dur": 5.975, + "args": { + "External id": 447271,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923713.204, "dur": 3.298, + "args": { + "External id": 447272,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923871.480, "dur": 151.803, + "args": { + "External id": 447273,"Record function id": 0, "Sequence number": 5285515, "Fwd thread id": 1, "Ev Idx": 808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007923873.529, "dur": 142.592, + "args": { + "External id": 447274,"Sequence number": 5285515, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 809 + } + }, + { + "ph": "f", "id": 85, "pid": 4183441, "tid": 31362, "ts": 676007923873.529, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007923886.091, "dur": 34.491, + "args": { + "External id": 447275,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923888.972, "dur": 2.360, + "args": { + "External id": 447276,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007923892.288, "dur": 27.756, + "args": { + "External id": 447277,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007923927.766, "dur": 5.153, + "args": { + "External id": 447278,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007923929.924, "dur": 2.703, + "args": { + "External id": 447279,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924029.317, "dur": 16.182, + "args": { + "External id": 447280,"Record function id": 0, "Sequence number": 5285514, "Fwd thread id": 1, "Ev Idx": 815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924030.552, "dur": 11.308, + "args": { + "External id": 447281,"Sequence number": 5285514, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 816 + } + }, + { + "ph": "f", "id": 86, "pid": 4183441, "tid": 31362, "ts": 676007924030.552, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924033.056, "dur": 8.558, + "args": { + "External id": 447282,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924036.215, "dur": 5.232, + "args": { + "External id": 447283,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924048.870, "dur": 7.177, + "args": { + "External id": 447284,"Record function id": 0, "Sequence number": 5285513, "Fwd thread id": 1, "Ev Idx": 819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924049.815, "dur": 3.586, + "args": { + "External id": 447285,"Sequence number": 5285513, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 820 + } + }, + { + "ph": "f", "id": 87, "pid": 4183441, "tid": 31362, "ts": 676007924049.815, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924051.334, "dur": 1.930, + "args": { + "External id": 447286,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924052.123, "dur": 0.997, + "args": { + "External id": 447287,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924061.052, "dur": 6.438, + "args": { + "External id": 447288,"Record function id": 0, "Sequence number": 5285512, "Fwd thread id": 1, "Ev Idx": 823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924061.829, "dur": 3.376, + "args": { + "External id": 447289,"Sequence number": 5285512, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 824 + } + }, + { + "ph": "f", "id": 88, "pid": 4183441, "tid": 31362, "ts": 676007924061.829, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924063.287, "dur": 1.776, + "args": { + "External id": 447290,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924064.094, "dur": 0.843, + "args": { + "External id": 447291,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924071.134, "dur": 8.986, + "args": { + "External id": 447292,"Record function id": 0, "Sequence number": 5285511, "Fwd thread id": 1, "Ev Idx": 827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924072.627, "dur": 5.047, + "args": { + "External id": 447293,"Sequence number": 5285511, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 828 + } + }, + { + "ph": "f", "id": 89, "pid": 4183441, "tid": 31362, "ts": 676007924072.627, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924073.781, "dur": 3.746, + "args": { + "External id": 447294,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924076.652, "dur": 0.779, + "args": { + "External id": 447295,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924102.375, "dur": 160.638, + "args": { + "External id": 447296,"Record function id": 0, "Sequence number": 5285510, "Fwd thread id": 1, "Ev Idx": 831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924103.711, "dur": 149.489, + "args": { + "External id": 447297,"Sequence number": 5285510, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 832 + } + }, + { + "ph": "f", "id": 90, "pid": 4183441, "tid": 31362, "ts": 676007924103.711, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924108.289, "dur": 7.399, + "args": { + "External id": 447298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924110.209, "dur": 4.630, + "args": { + "External id": 447299,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924112.896, "dur": 1.575, + "args": { + "External id": 447300,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924119.162, "dur": 79.202, + "args": { + "External id": 447301,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924199.691, "dur": 4.741, + "args": { + "External id": 447302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924200.404, "dur": 3.249, + "args": { + "External id": 447303,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924202.344, "dur": 1.156, + "args": { + "External id": 447304,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924206.350, "dur": 5.606, + "args": { + "External id": 447305,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924207.241, "dur": 4.095, + "args": { + "External id": 447306,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924210.955, "dur": 0.314, + "args": { + "External id": 447307,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924212.556, "dur": 39.737, + "args": { + "External id": 447308,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924267.569, "dur": 6.713, + "args": { + "External id": 447309,"Record function id": 0, "Sequence number": 5285509, "Fwd thread id": 1, "Ev Idx": 844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924268.357, "dur": 4.349, + "args": { + "External id": 447310,"Sequence number": 5285509, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 845 + } + }, + { + "ph": "f", "id": 91, "pid": 4183441, "tid": 31362, "ts": 676007924268.357, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924270.079, "dur": 2.492, + "args": { + "External id": 447311,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924271.233, "dur": 1.250, + "args": { + "External id": 447312,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924277.455, "dur": 9.027, + "args": { + "External id": 447313,"Record function id": 0, "Sequence number": 5285508, "Fwd thread id": 1, "Ev Idx": 848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924278.399, "dur": 6.133, + "args": { + "External id": 447314,"Sequence number": 5285508, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 849 + } + }, + { + "ph": "f", "id": 92, "pid": 4183441, "tid": 31362, "ts": 676007924278.399, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924279.436, "dur": 4.888, + "args": { + "External id": 447315,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924280.015, "dur": 3.791, + "args": { + "External id": 447316,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924283.220, "dur": 0.431, + "args": { + "External id": 447317,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924292.210, "dur": 8.864, + "args": { + "External id": 447318,"Record function id": 0, "Ev Idx": 853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924294.042, "dur": 6.407, + "args": { + "External id": 447319,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007924296.468, "dur": 3.612, + "args": { + "External id": 447320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007924297.512, "dur": 2.467, + "args": { + "External id": 447321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924304.237, "dur": 6.351, + "args": { + "External id": 447322,"Record function id": 0, "Sequence number": 5285507, "Fwd thread id": 1, "Ev Idx": 857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924305.310, "dur": 3.226, + "args": { + "External id": 447323,"Sequence number": 5285507, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 858 + } + }, + { + "ph": "f", "id": 93, "pid": 4183441, "tid": 31362, "ts": 676007924305.310, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924306.650, "dur": 1.729, + "args": { + "External id": 447324,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924307.590, "dur": 0.663, + "args": { + "External id": 447325,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924313.722, "dur": 94.490, + "args": { + "External id": 447326,"Record function id": 0, "Sequence number": 5285506, "Fwd thread id": 1, "Ev Idx": 861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924314.509, "dur": 88.352, + "args": { + "External id": 447327,"Sequence number": 5285506, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 862 + } + }, + { + "ph": "f", "id": 94, "pid": 4183441, "tid": 31362, "ts": 676007924314.509, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924319.068, "dur": 3.090, + "args": { + "External id": 447328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924319.679, "dur": 2.036, + "args": { + "External id": 447329,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924321.190, "dur": 0.421, + "args": { + "External id": 447330,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924322.934, "dur": 33.888, + "args": { + "External id": 447331,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924357.875, "dur": 3.924, + "args": { + "External id": 447332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924358.406, "dur": 2.763, + "args": { + "External id": 447333,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924359.788, "dur": 1.249, + "args": { + "External id": 447334,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924364.861, "dur": 5.427, + "args": { + "External id": 447335,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924365.686, "dur": 4.169, + "args": { + "External id": 447336,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924367.148, "dur": 2.626, + "args": { + "External id": 447337,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924370.763, "dur": 31.289, + "args": { + "External id": 447338,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924412.556, "dur": 34.200, + "args": { + "External id": 447339,"Record function id": 0, "Sequence number": 5285505, "Fwd thread id": 1, "Ev Idx": 874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924413.611, "dur": 4.287, + "args": { + "External id": 447340,"Sequence number": 5285505, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 875 + } + }, + { + "ph": "f", "id": 95, "pid": 4183441, "tid": 31362, "ts": 676007924413.611, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924415.603, "dur": 2.147, + "args": { + "External id": 447341,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924416.680, "dur": 0.974, + "args": { + "External id": 447342,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007924421.031, "dur": 21.407, + "args": { + "External id": 447343,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924450.388, "dur": 8.237, + "args": { + "External id": 447344,"Record function id": 0, "Sequence number": 5285504, "Fwd thread id": 1, "Ev Idx": 879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924451.324, "dur": 4.923, + "args": { + "External id": 447345,"Sequence number": 5285504, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 880 + } + }, + { + "ph": "f", "id": 96, "pid": 4183441, "tid": 31362, "ts": 676007924451.324, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924452.523, "dur": 3.500, + "args": { + "External id": 447346,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924453.321, "dur": 2.165, + "args": { + "External id": 447347,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924454.887, "dur": 0.483, + "args": { + "External id": 447348,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924462.670, "dur": 7.317, + "args": { + "External id": 447349,"Record function id": 0, "Ev Idx": 884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924464.198, "dur": 5.309, + "args": { + "External id": 447350,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007924465.022, "dur": 4.238, + "args": { + "External id": 447351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007924467.740, "dur": 1.407, + "args": { + "External id": 447352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924473.165, "dur": 6.626, + "args": { + "External id": 447353,"Record function id": 0, "Sequence number": 5285503, "Fwd thread id": 1, "Ev Idx": 888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924474.388, "dur": 3.350, + "args": { + "External id": 447354,"Sequence number": 5285503, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 889 + } + }, + { + "ph": "f", "id": 97, "pid": 4183441, "tid": 31362, "ts": 676007924474.388, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924475.801, "dur": 1.783, + "args": { + "External id": 447355,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924476.695, "dur": 0.789, + "args": { + "External id": 447356,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924485.108, "dur": 98.969, + "args": { + "External id": 447357,"Record function id": 0, "Sequence number": 5285502, "Fwd thread id": 1, "Ev Idx": 892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924485.959, "dur": 88.941, + "args": { + "External id": 447358,"Sequence number": 5285502, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 893 + } + }, + { + "ph": "f", "id": 98, "pid": 4183441, "tid": 31362, "ts": 676007924485.959, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924488.887, "dur": 4.508, + "args": { + "External id": 447359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924489.526, "dur": 3.425, + "args": { + "External id": 447360,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924492.414, "dur": 0.420, + "args": { + "External id": 447361,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924494.182, "dur": 35.999, + "args": { + "External id": 447362,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924531.255, "dur": 4.263, + "args": { + "External id": 447363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924531.888, "dur": 2.961, + "args": { + "External id": 447364,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924533.443, "dur": 1.288, + "args": { + "External id": 447365,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924536.567, "dur": 7.182, + "args": { + "External id": 447366,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924541.304, "dur": 1.991, + "args": { + "External id": 447367,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924542.704, "dur": 0.513, + "args": { + "External id": 447368,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007924544.194, "dur": 30.173, + "args": { + "External id": 447369,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924588.200, "dur": 25.613, + "args": { + "External id": 447370,"Record function id": 0, "Sequence number": 5285501, "Fwd thread id": 1, "Ev Idx": 905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924589.121, "dur": 4.033, + "args": { + "External id": 447371,"Sequence number": 5285501, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 906 + } + }, + { + "ph": "f", "id": 99, "pid": 4183441, "tid": 31362, "ts": 676007924589.121, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924590.784, "dur": 2.229, + "args": { + "External id": 447372,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924591.839, "dur": 1.052, + "args": { + "External id": 447373,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007924595.361, "dur": 16.476, + "args": { + "External id": 447374,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924617.221, "dur": 9.422, + "args": { + "External id": 447375,"Record function id": 0, "Sequence number": 5285500, "Fwd thread id": 1, "Ev Idx": 910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007924620.264, "dur": 4.602, + "args": { + "External id": 447376,"Sequence number": 5285500, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 911 + } + }, + { + "ph": "f", "id": 100, "pid": 4183441, "tid": 31362, "ts": 676007924620.264, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007924621.244, "dur": 3.431, + "args": { + "External id": 447377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007924621.932, "dur": 2.229, + "args": { + "External id": 447378,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924623.646, "dur": 0.361, + "args": { + "External id": 447379,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924630.663, "dur": 4.823, + "args": { + "External id": 447380,"Record function id": 0, "Ev Idx": 915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007924632.324, "dur": 2.721, + "args": { + "External id": 447381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007924633.226, "dur": 1.580, + "args": { + "External id": 447382,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007924633.632, "dur": 1.056, + "args": { + "External id": 447383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007924639.745, "dur": 400.028, + "args": { + "External id": 447384,"Record function id": 0, "Sequence number": 5285499, "Fwd thread id": 1, "Ev Idx": 919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007924641.360, "dur": 364.677, + "args": { + "External id": 447385,"Sequence number": 5285499, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 920 + } + }, + { + "ph": "f", "id": 101, "pid": 4183441, "tid": 31362, "ts": 676007924641.360, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924721.236, "dur": 5.146, + "args": { + "External id": 447386,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924723.963, "dur": 2.116, + "args": { + "External id": 447387,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007924739.693, "dur": 6.588, + "args": { + "External id": 447388,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007924755.418, "dur": 2.528, + "args": { + "External id": 447389,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924902.137, "dur": 2.000, + "args": { + "External id": 447390,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007924908.203, "dur": 35.452, + "args": { + "External id": 447391,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924918.860, "dur": 1.140, + "args": { + "External id": 447392,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007924952.423, "dur": 30.787, + "args": { + "External id": 447393,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007924954.414, "dur": 28.577, + "args": { + "External id": 447394,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007924960.250, "dur": 4.898, + "args": { + "External id": 447395,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007924966.672, "dur": 15.750, + "args": { + "External id": 447396,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007924987.383, "dur": 2.592, + "args": { + "External id": 447397,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924988.919, "dur": 0.960, + "args": { + "External id": 447398,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007924996.932, "dur": 2.539, + "args": { + "External id": 447399,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007924998.399, "dur": 0.926, + "args": { + "External id": 447400,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007925019.354, "dur": 16.310, + "args": { + "External id": 447401,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925052.512, "dur": 9.053, + "args": { + "External id": 447402,"Record function id": 0, "Ev Idx": 937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925054.803, "dur": 6.046, + "args": { + "External id": 447403,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007925056.822, "dur": 2.999, + "args": { + "External id": 447404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007925057.922, "dur": 1.796, + "args": { + "External id": 447405,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925065.433, "dur": 7.014, + "args": { + "External id": 447406,"Record function id": 0, "Sequence number": 5285498, "Fwd thread id": 1, "Ev Idx": 941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925066.985, "dur": 1.195, + "args": { + "External id": 447407,"Sequence number": 5285498, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 942 + } + }, + { + "ph": "f", "id": 102, "pid": 4183441, "tid": 31362, "ts": 676007925066.985, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007925076.479, "dur": 415.363, + "args": { + "External id": 447408,"Record function id": 0, "Sequence number": 5285497, "Fwd thread id": 1, "Ev Idx": 943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007925077.802, "dur": 399.212, + "args": { + "External id": 447409,"Sequence number": 5285497, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 944 + } + }, + { + "ph": "f", "id": 103, "pid": 4183441, "tid": 31362, "ts": 676007925077.802, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925130.389, "dur": 9.361, + "args": { + "External id": 447410,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007925135.867, "dur": 3.526, + "args": { + "External id": 447411,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925143.026, "dur": 5.516, + "args": { + "External id": 447412,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925144.716, "dur": 3.042, + "args": { + "External id": 447413,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925146.825, "dur": 0.774, + "args": { + "External id": 447414,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 31362, + "ts": 676007925152.235, "dur": 92.676, + "args": { + "External id": 447415,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925153.094, "dur": 6.619, + "args": { + "External id": 447416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925155.815, "dur": 3.414, + "args": { + "External id": 447417,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925157.299, "dur": 1.771, + "args": { + "External id": 447418,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 31362, + "ts": 676007925160.902, "dur": 83.228, + "args": { + "External id": 447419,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007925162.246, "dur": 81.082, + "args": { + "External id": 447420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007925248.654, "dur": 3.107, + "args": { + "External id": 447421,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925250.168, "dur": 1.468, + "args": { + "External id": 447422,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007925285.332, "dur": 5.143, + "args": { + "External id": 447423,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007925291.876, "dur": 1.936, + "args": { + "External id": 447424,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007925294.990, "dur": 1.584, + "args": { + "External id": 447425,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925326.612, "dur": 2.260, + "args": { + "External id": 447426,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925327.647, "dur": 1.075, + "args": { + "External id": 447427,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183441, "tid": 31362, + "ts": 676007925349.987, "dur": 107.966, + "args": { + "External id": 447428,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007925354.736, "dur": 5.045, + "args": { + "External id": 447429,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925358.482, "dur": 0.635, + "args": { + "External id": 447430,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007925361.602, "dur": 8.207, + "args": { + "External id": 447431,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925366.586, "dur": 2.409, + "args": { + "External id": 447432,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007925371.061, "dur": 2.745, + "args": { + "External id": 447433,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925372.955, "dur": 0.452, + "args": { + "External id": 447434,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007925374.705, "dur": 2.891, + "args": { + "External id": 447435,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925376.549, "dur": 0.618, + "args": { + "External id": 447436,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007925381.224, "dur": 2.888, + "args": { + "External id": 447437,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925383.193, "dur": 0.616, + "args": { + "External id": 447438,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925385.229, "dur": 5.493, + "args": { + "External id": 447439,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007925388.629, "dur": 1.875, + "args": { + "External id": 447440,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007925391.969, "dur": 2.534, + "args": { + "External id": 447441,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925393.909, "dur": 0.284, + "args": { + "External id": 447442,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925397.227, "dur": 3.982, + "args": { + "External id": 447443,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925398.168, "dur": 2.929, + "args": { + "External id": 447444,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007925402.292, "dur": 42.632, + "args": { + "External id": 447445,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925446.981, "dur": 2.819, + "args": { + "External id": 447446,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007925451.045, "dur": 3.001, + "args": { + "External id": 447447,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925453.071, "dur": 0.408, + "args": { + "External id": 447448,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925456.152, "dur": 0.814, + "args": { + "External id": 447449,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925502.243, "dur": 8.519, + "args": { + "External id": 447450,"Record function id": 0, "Ev Idx": 985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925504.522, "dur": 5.526, + "args": { + "External id": 447451,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007925506.347, "dur": 2.979, + "args": { + "External id": 447452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007925507.271, "dur": 1.944, + "args": { + "External id": 447453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925514.646, "dur": 6.935, + "args": { + "External id": 447454,"Record function id": 0, "Sequence number": 5285496, "Fwd thread id": 1, "Ev Idx": 989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925515.903, "dur": 3.415, + "args": { + "External id": 447455,"Sequence number": 5285496, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 990 + } + }, + { + "ph": "f", "id": 104, "pid": 4183441, "tid": 31362, "ts": 676007925515.903, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925517.450, "dur": 1.645, + "args": { + "External id": 447456,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925518.211, "dur": 0.748, + "args": { + "External id": 447457,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925524.927, "dur": 103.071, + "args": { + "External id": 447458,"Record function id": 0, "Sequence number": 5285495, "Fwd thread id": 1, "Ev Idx": 993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925526.081, "dur": 94.519, + "args": { + "External id": 447459,"Sequence number": 5285495, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 994 + } + }, + { + "ph": "f", "id": 105, "pid": 4183441, "tid": 31362, "ts": 676007925526.081, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925529.683, "dur": 5.284, + "args": { + "External id": 447460,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925530.706, "dur": 3.746, + "args": { + "External id": 447461,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925533.854, "dur": 0.433, + "args": { + "External id": 447462,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007925535.882, "dur": 33.345, + "args": { + "External id": 447463,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925570.087, "dur": 3.871, + "args": { + "External id": 447464,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925570.652, "dur": 2.613, + "args": { + "External id": 447465,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925572.271, "dur": 0.834, + "args": { + "External id": 447466,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925575.556, "dur": 5.802, + "args": { + "External id": 447467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925578.420, "dur": 2.435, + "args": { + "External id": 447468,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925580.256, "dur": 0.461, + "args": { + "External id": 447469,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007925581.831, "dur": 37.905, + "args": { + "External id": 447470,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925632.706, "dur": 6.869, + "args": { + "External id": 447471,"Record function id": 0, "Sequence number": 5285494, "Fwd thread id": 1, "Ev Idx": 1006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925633.895, "dur": 4.244, + "args": { + "External id": 447472,"Sequence number": 5285494, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1007 + } + }, + { + "ph": "f", "id": 106, "pid": 4183441, "tid": 31362, "ts": 676007925633.895, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925635.600, "dur": 2.388, + "args": { + "External id": 447473,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925636.488, "dur": 1.400, + "args": { + "External id": 447474,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925642.790, "dur": 9.561, + "args": { + "External id": 447475,"Record function id": 0, "Sequence number": 5285493, "Fwd thread id": 1, "Ev Idx": 1010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925643.834, "dur": 6.217, + "args": { + "External id": 447476,"Sequence number": 5285493, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1011 + } + }, + { + "ph": "f", "id": 107, "pid": 4183441, "tid": 31362, "ts": 676007925643.834, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925645.007, "dur": 4.815, + "args": { + "External id": 447477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925647.330, "dur": 1.966, + "args": { + "External id": 447478,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925648.716, "dur": 0.494, + "args": { + "External id": 447479,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925695.598, "dur": 7.858, + "args": { + "External id": 447480,"Record function id": 0, "Ev Idx": 1015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925698.068, "dur": 4.563, + "args": { + "External id": 447481,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007925699.686, "dur": 2.575, + "args": { + "External id": 447482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007925700.366, "dur": 1.676, + "args": { + "External id": 447483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925708.975, "dur": 7.676, + "args": { + "External id": 447484,"Record function id": 0, "Sequence number": 5285492, "Fwd thread id": 1, "Ev Idx": 1019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925710.465, "dur": 3.756, + "args": { + "External id": 447485,"Sequence number": 5285492, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1020 + } + }, + { + "ph": "f", "id": 108, "pid": 4183441, "tid": 31362, "ts": 676007925710.465, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925712.262, "dur": 1.810, + "args": { + "External id": 447486,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925712.963, "dur": 0.974, + "args": { + "External id": 447487,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925721.593, "dur": 119.921, + "args": { + "External id": 447488,"Record function id": 0, "Sequence number": 5285491, "Fwd thread id": 1, "Ev Idx": 1023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925743.269, "dur": 88.998, + "args": { + "External id": 447489,"Sequence number": 5285491, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1024 + } + }, + { + "ph": "f", "id": 109, "pid": 4183441, "tid": 31362, "ts": 676007925743.269, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925746.373, "dur": 2.870, + "args": { + "External id": 447490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925746.946, "dur": 1.848, + "args": { + "External id": 447491,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925748.222, "dur": 0.468, + "args": { + "External id": 447492,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007925749.996, "dur": 32.012, + "args": { + "External id": 447493,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925784.993, "dur": 4.802, + "args": { + "External id": 447494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925785.554, "dur": 3.639, + "args": { + "External id": 447495,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925787.310, "dur": 1.738, + "args": { + "External id": 447496,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925790.936, "dur": 4.898, + "args": { + "External id": 447497,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925791.923, "dur": 3.286, + "args": { + "External id": 447498,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925793.218, "dur": 1.921, + "args": { + "External id": 447499,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007925798.554, "dur": 33.107, + "args": { + "External id": 447500,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925845.809, "dur": 31.209, + "args": { + "External id": 447501,"Record function id": 0, "Sequence number": 5285490, "Fwd thread id": 1, "Ev Idx": 1036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925846.672, "dur": 4.236, + "args": { + "External id": 447502,"Sequence number": 5285490, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1037 + } + }, + { + "ph": "f", "id": 110, "pid": 4183441, "tid": 31362, "ts": 676007925846.672, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925848.659, "dur": 2.107, + "args": { + "External id": 447503,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925849.685, "dur": 0.946, + "args": { + "External id": 447504,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007925854.214, "dur": 20.124, + "args": { + "External id": 447505,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925880.565, "dur": 10.689, + "args": { + "External id": 447506,"Record function id": 0, "Sequence number": 5285489, "Fwd thread id": 1, "Ev Idx": 1041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007925881.528, "dur": 7.154, + "args": { + "External id": 447507,"Sequence number": 5285489, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1042 + } + }, + { + "ph": "f", "id": 111, "pid": 4183441, "tid": 31362, "ts": 676007925881.528, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007925882.348, "dur": 6.132, + "args": { + "External id": 447508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007925882.865, "dur": 5.077, + "args": { + "External id": 447509,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007925887.207, "dur": 0.627, + "args": { + "External id": 447510,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925895.469, "dur": 5.334, + "args": { + "External id": 447511,"Record function id": 0, "Ev Idx": 1046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007925897.194, "dur": 3.113, + "args": { + "External id": 447512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007925898.270, "dur": 1.577, + "args": { + "External id": 447513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007925898.654, "dur": 1.102, + "args": { + "External id": 447514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007925905.226, "dur": 439.778, + "args": { + "External id": 447515,"Record function id": 0, "Sequence number": 5285488, "Fwd thread id": 1, "Ev Idx": 1050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007925906.901, "dur": 403.932, + "args": { + "External id": 447516,"Sequence number": 5285488, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 1051 + } + }, + { + "ph": "f", "id": 112, "pid": 4183441, "tid": 31362, "ts": 676007925906.901, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 31362, + "ts": 676007925932.983, "dur": 32.857, + "args": { + "External id": 447517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007925934.318, "dur": 31.306, + "args": { + "External id": 447518,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007925937.249, "dur": 5.809, + "args": { + "External id": 447519,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 1054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007925939.777, "dur": 2.843, + "args": { + "External id": 447520,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007925944.360, "dur": 20.759, + "args": { + "External id": 447521,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925977.350, "dur": 2.539, + "args": { + "External id": 447522,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925978.561, "dur": 1.214, + "args": { + "External id": 447523,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007925985.243, "dur": 3.267, + "args": { + "External id": 447524,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007925986.138, "dur": 2.235, + "args": { + "External id": 447525,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007925999.720, "dur": 1.991, + "args": { + "External id": 447526,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007926012.446, "dur": 3.207, + "args": { + "External id": 447527,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926202.845, "dur": 3.508, + "args": { + "External id": 447528,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007926210.818, "dur": 31.844, + "args": { + "External id": 447529,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926219.926, "dur": 1.075, + "args": { + "External id": 447530,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007926248.402, "dur": 28.211, + "args": { + "External id": 447531,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007926250.046, "dur": 26.301, + "args": { + "External id": 447532,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926254.133, "dur": 4.220, + "args": { + "External id": 447533,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007926259.884, "dur": 15.897, + "args": { + "External id": 447534,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007926281.289, "dur": 2.587, + "args": { + "External id": 447535,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926282.717, "dur": 1.045, + "args": { + "External id": 447536,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007926292.717, "dur": 2.752, + "args": { + "External id": 447537,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926293.965, "dur": 1.395, + "args": { + "External id": 447538,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007926298.260, "dur": 3.610, + "args": { + "External id": 447539,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926298.900, "dur": 2.871, + "args": { + "External id": 447540,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007926327.768, "dur": 15.726, + "args": { + "External id": 447541,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007926357.655, "dur": 11.098, + "args": { + "External id": 447542,"Record function id": 0, "Ev Idx": 1077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007926360.215, "dur": 7.913, + "args": { + "External id": 447543,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007926362.370, "dur": 4.956, + "args": { + "External id": 447544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007926365.555, "dur": 1.620, + "args": { + "External id": 447545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926372.564, "dur": 7.473, + "args": { + "External id": 447546,"Record function id": 0, "Sequence number": 5285487, "Fwd thread id": 1, "Ev Idx": 1081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926373.712, "dur": 3.692, + "args": { + "External id": 447547,"Sequence number": 5285487, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1082 + } + }, + { + "ph": "f", "id": 113, "pid": 4183441, "tid": 31362, "ts": 676007926373.712, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007926375.256, "dur": 1.918, + "args": { + "External id": 447548,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926376.095, "dur": 0.979, + "args": { + "External id": 447549,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926383.284, "dur": 185.291, + "args": { + "External id": 447550,"Record function id": 0, "Sequence number": 5285486, "Fwd thread id": 1, "Ev Idx": 1085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926384.427, "dur": 174.975, + "args": { + "External id": 447551,"Sequence number": 5285486, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1086 + } + }, + { + "ph": "f", "id": 114, "pid": 4183441, "tid": 31362, "ts": 676007926384.427, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007926388.078, "dur": 6.897, + "args": { + "External id": 447552,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007926389.479, "dur": 4.894, + "args": { + "External id": 447553,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926393.245, "dur": 0.865, + "args": { + "External id": 447554,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007926395.903, "dur": 92.963, + "args": { + "External id": 447555,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007926489.866, "dur": 6.230, + "args": { + "External id": 447556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007926490.712, "dur": 4.785, + "args": { + "External id": 447557,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926492.649, "dur": 2.683, + "args": { + "External id": 447558,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007926497.809, "dur": 5.655, + "args": { + "External id": 447559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007926500.856, "dur": 2.159, + "args": { + "External id": 447560,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926502.615, "dur": 0.288, + "args": { + "External id": 447561,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007926504.003, "dur": 54.699, + "args": { + "External id": 447562,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926572.908, "dur": 9.297, + "args": { + "External id": 447563,"Record function id": 0, "Sequence number": 5285485, "Fwd thread id": 1, "Ev Idx": 1098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926573.844, "dur": 6.327, + "args": { + "External id": 447564,"Sequence number": 5285485, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1099 + } + }, + { + "ph": "f", "id": 115, "pid": 4183441, "tid": 31362, "ts": 676007926573.844, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007926575.634, "dur": 4.388, + "args": { + "External id": 447565,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926577.042, "dur": 2.885, + "args": { + "External id": 447566,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926585.516, "dur": 9.750, + "args": { + "External id": 447567,"Record function id": 0, "Sequence number": 5285484, "Fwd thread id": 1, "Ev Idx": 1102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926586.582, "dur": 6.565, + "args": { + "External id": 447568,"Sequence number": 5285484, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1103 + } + }, + { + "ph": "f", "id": 116, "pid": 4183441, "tid": 31362, "ts": 676007926586.582, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007926587.831, "dur": 5.117, + "args": { + "External id": 447569,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007926590.349, "dur": 2.078, + "args": { + "External id": 447570,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926591.917, "dur": 0.410, + "args": { + "External id": 447571,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007926599.185, "dur": 5.067, + "args": { + "External id": 447572,"Record function id": 0, "Ev Idx": 1107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007926600.686, "dur": 3.073, + "args": { + "External id": 447573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007926601.608, "dur": 1.893, + "args": { + "External id": 447574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007926602.177, "dur": 1.245, + "args": { + "External id": 447575,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926609.232, "dur": 7.733, + "args": { + "External id": 447576,"Record function id": 0, "Sequence number": 5285483, "Fwd thread id": 1, "Ev Idx": 1111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007926610.178, "dur": 3.851, + "args": { + "External id": 447577,"Sequence number": 5285483, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1112 + } + }, + { + "ph": "f", "id": 117, "pid": 4183441, "tid": 31362, "ts": 676007926610.178, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007926611.811, "dur": 2.069, + "args": { + "External id": 447578,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007926612.700, "dur": 1.046, + "args": { + "External id": 447579,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007926621.304, "dur": 344.564, + "args": { + "External id": 447580,"Record function id": 0, "Sequence number": 5285482, "Fwd thread id": 1, "Ev Idx": 1115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007926622.861, "dur": 321.779, + "args": { + "External id": 447581,"Sequence number": 5285482, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1116 + } + }, + { + "ph": "f", "id": 118, "pid": 4183441, "tid": 31362, "ts": 676007926622.861, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007926639.333, "dur": 6.619, + "args": { + "External id": 447582,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926642.460, "dur": 3.164, + "args": { + "External id": 447583,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007926648.293, "dur": 5.056, + "args": { + "External id": 447584,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926650.013, "dur": 3.157, + "args": { + "External id": 447585,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007926711.323, "dur": 7.374, + "args": { + "External id": 447586,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007926714.963, "dur": 3.278, + "args": { + "External id": 447587,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007926747.050, "dur": 170.840, + "args": { + "External id": 447588,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007926820.294, "dur": 5.614, + "args": { + "External id": 447589,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007926827.557, "dur": 4.199, + "args": { + "External id": 447590,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007926930.699, "dur": 4.016, + "args": { + "External id": 447591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007926937.836, "dur": 0.868, + "args": { + "External id": 447592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007926940.764, "dur": 0.628, + "args": { + "External id": 447593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007926976.921, "dur": 246.797, + "args": { + "External id": 447594,"Record function id": 0, "Sequence number": 5285481, "Fwd thread id": 1, "Ev Idx": 1129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007926979.201, "dur": 236.190, + "args": { + "External id": 447595,"Sequence number": 5285481, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1130 + } + }, + { + "ph": "f", "id": 119, "pid": 4183441, "tid": 31362, "ts": 676007926979.201, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007926999.488, "dur": 40.923, + "args": { + "External id": 447596,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927002.643, "dur": 2.821, + "args": { + "External id": 447597,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007927006.749, "dur": 33.092, + "args": { + "External id": 447598,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007927050.075, "dur": 5.672, + "args": { + "External id": 447599,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927052.221, "dur": 3.175, + "args": { + "External id": 447600,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007927233.598, "dur": 157.189, + "args": { + "External id": 447601,"Record function id": 0, "Sequence number": 5285480, "Fwd thread id": 1, "Ev Idx": 1136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007927235.616, "dur": 148.315, + "args": { + "External id": 447602,"Sequence number": 5285480, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1137 + } + }, + { + "ph": "f", "id": 120, "pid": 4183441, "tid": 31362, "ts": 676007927235.616, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007927249.049, "dur": 37.713, + "args": { + "External id": 447603,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927252.070, "dur": 3.740, + "args": { + "External id": 447604,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007927260.970, "dur": 25.203, + "args": { + "External id": 447605,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007927294.540, "dur": 4.717, + "args": { + "External id": 447606,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927296.490, "dur": 2.459, + "args": { + "External id": 447607,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927397.138, "dur": 16.633, + "args": { + "External id": 447608,"Record function id": 0, "Sequence number": 5285479, "Fwd thread id": 1, "Ev Idx": 1143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927398.670, "dur": 12.044, + "args": { + "External id": 447609,"Sequence number": 5285479, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1144 + } + }, + { + "ph": "f", "id": 121, "pid": 4183441, "tid": 31362, "ts": 676007927398.670, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927401.425, "dur": 9.012, + "args": { + "External id": 447610,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927403.007, "dur": 7.231, + "args": { + "External id": 447611,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927417.315, "dur": 8.878, + "args": { + "External id": 447612,"Record function id": 0, "Sequence number": 5285478, "Fwd thread id": 1, "Ev Idx": 1147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927420.214, "dur": 4.232, + "args": { + "External id": 447613,"Sequence number": 5285478, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1148 + } + }, + { + "ph": "f", "id": 122, "pid": 4183441, "tid": 31362, "ts": 676007927420.214, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927421.886, "dur": 2.421, + "args": { + "External id": 447614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927423.059, "dur": 1.132, + "args": { + "External id": 447615,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927429.261, "dur": 6.763, + "args": { + "External id": 447616,"Record function id": 0, "Sequence number": 5285477, "Fwd thread id": 1, "Ev Idx": 1151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927430.116, "dur": 3.550, + "args": { + "External id": 447617,"Sequence number": 5285477, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1152 + } + }, + { + "ph": "f", "id": 123, "pid": 4183441, "tid": 31362, "ts": 676007927430.116, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927431.462, "dur": 2.065, + "args": { + "External id": 447618,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927432.561, "dur": 0.841, + "args": { + "External id": 447619,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927439.773, "dur": 9.736, + "args": { + "External id": 447620,"Record function id": 0, "Sequence number": 5285476, "Fwd thread id": 1, "Ev Idx": 1155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927441.254, "dur": 5.426, + "args": { + "External id": 447621,"Sequence number": 5285476, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1156 + } + }, + { + "ph": "f", "id": 124, "pid": 4183441, "tid": 31362, "ts": 676007927441.254, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927442.603, "dur": 3.932, + "args": { + "External id": 447622,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927445.480, "dur": 0.916, + "args": { + "External id": 447623,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927453.149, "dur": 163.039, + "args": { + "External id": 447624,"Record function id": 0, "Sequence number": 5285475, "Fwd thread id": 1, "Ev Idx": 1159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927453.984, "dur": 154.178, + "args": { + "External id": 447625,"Sequence number": 5285475, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1160 + } + }, + { + "ph": "f", "id": 125, "pid": 4183441, "tid": 31362, "ts": 676007927453.984, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927459.957, "dur": 7.316, + "args": { + "External id": 447626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927461.873, "dur": 4.650, + "args": { + "External id": 447627,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927464.562, "dur": 1.651, + "args": { + "External id": 447628,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927468.967, "dur": 80.631, + "args": { + "External id": 447629,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927553.185, "dur": 4.634, + "args": { + "External id": 447630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927554.132, "dur": 2.767, + "args": { + "External id": 447631,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927555.678, "dur": 1.082, + "args": { + "External id": 447632,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927560.327, "dur": 3.861, + "args": { + "External id": 447633,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927561.824, "dur": 1.928, + "args": { + "External id": 447634,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927563.323, "dur": 0.365, + "args": { + "External id": 447635,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927566.710, "dur": 40.591, + "args": { + "External id": 447636,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927623.426, "dur": 7.915, + "args": { + "External id": 447637,"Record function id": 0, "Sequence number": 5285474, "Fwd thread id": 1, "Ev Idx": 1172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927624.547, "dur": 4.500, + "args": { + "External id": 447638,"Sequence number": 5285474, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1173 + } + }, + { + "ph": "f", "id": 126, "pid": 4183441, "tid": 31362, "ts": 676007927624.547, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927626.359, "dur": 2.545, + "args": { + "External id": 447639,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927627.707, "dur": 1.083, + "args": { + "External id": 447640,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927634.562, "dur": 10.182, + "args": { + "External id": 447641,"Record function id": 0, "Sequence number": 5285473, "Fwd thread id": 1, "Ev Idx": 1176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927635.549, "dur": 6.622, + "args": { + "External id": 447642,"Sequence number": 5285473, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1177 + } + }, + { + "ph": "f", "id": 127, "pid": 4183441, "tid": 31362, "ts": 676007927635.549, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927636.530, "dur": 5.424, + "args": { + "External id": 447643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927637.132, "dur": 4.328, + "args": { + "External id": 447644,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927641.033, "dur": 0.334, + "args": { + "External id": 447645,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007927650.823, "dur": 51.620, + "args": { + "External id": 447646,"Record function id": 0, "Ev Idx": 1181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007927652.763, "dur": 48.247, + "args": { + "External id": 447647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007927695.722, "dur": 4.749, + "args": { + "External id": 447648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007927697.131, "dur": 3.056, + "args": { + "External id": 447649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927707.574, "dur": 9.381, + "args": { + "External id": 447650,"Record function id": 0, "Sequence number": 5285472, "Fwd thread id": 1, "Ev Idx": 1185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927709.643, "dur": 4.668, + "args": { + "External id": 447651,"Sequence number": 5285472, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1186 + } + }, + { + "ph": "f", "id": 128, "pid": 4183441, "tid": 31362, "ts": 676007927709.643, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927711.446, "dur": 2.698, + "args": { + "External id": 447652,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927712.349, "dur": 1.700, + "args": { + "External id": 447653,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927720.427, "dur": 110.935, + "args": { + "External id": 447654,"Record function id": 0, "Sequence number": 5285471, "Fwd thread id": 1, "Ev Idx": 1189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927721.320, "dur": 101.989, + "args": { + "External id": 447655,"Sequence number": 5285471, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1190 + } + }, + { + "ph": "f", "id": 129, "pid": 4183441, "tid": 31362, "ts": 676007927721.320, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927726.922, "dur": 4.843, + "args": { + "External id": 447656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927727.901, "dur": 3.421, + "args": { + "External id": 447657,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927730.352, "dur": 0.850, + "args": { + "External id": 447658,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927732.592, "dur": 41.933, + "args": { + "External id": 447659,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927775.613, "dur": 4.163, + "args": { + "External id": 447660,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927776.290, "dur": 2.862, + "args": { + "External id": 447661,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927778.124, "dur": 0.907, + "args": { + "External id": 447662,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927782.713, "dur": 5.938, + "args": { + "External id": 447663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927784.343, "dur": 3.615, + "args": { + "External id": 447664,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927785.661, "dur": 2.205, + "args": { + "External id": 447665,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927789.304, "dur": 33.170, + "args": { + "External id": 447666,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927835.994, "dur": 34.716, + "args": { + "External id": 447667,"Record function id": 0, "Sequence number": 5285470, "Fwd thread id": 1, "Ev Idx": 1202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927836.917, "dur": 6.395, + "args": { + "External id": 447668,"Sequence number": 5285470, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1203 + } + }, + { + "ph": "f", "id": 130, "pid": 4183441, "tid": 31362, "ts": 676007927836.917, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927838.882, "dur": 4.290, + "args": { + "External id": 447669,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927841.845, "dur": 1.228, + "args": { + "External id": 447670,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007927846.557, "dur": 21.574, + "args": { + "External id": 447671,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927874.329, "dur": 11.704, + "args": { + "External id": 447672,"Record function id": 0, "Sequence number": 5285469, "Fwd thread id": 1, "Ev Idx": 1207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927875.567, "dur": 5.199, + "args": { + "External id": 447673,"Sequence number": 5285469, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1208 + } + }, + { + "ph": "f", "id": 131, "pid": 4183441, "tid": 31362, "ts": 676007927875.567, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927876.653, "dur": 3.884, + "args": { + "External id": 447674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927877.318, "dur": 2.617, + "args": { + "External id": 447675,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927879.028, "dur": 0.812, + "args": { + "External id": 447676,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007927890.270, "dur": 8.112, + "args": { + "External id": 447677,"Record function id": 0, "Ev Idx": 1212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007927892.446, "dur": 5.451, + "args": { + "External id": 447678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007927893.599, "dur": 3.815, + "args": { + "External id": 447679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007927895.691, "dur": 1.613, + "args": { + "External id": 447680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927901.645, "dur": 9.608, + "args": { + "External id": 447681,"Record function id": 0, "Sequence number": 5285468, "Fwd thread id": 1, "Ev Idx": 1216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927902.817, "dur": 5.598, + "args": { + "External id": 447682,"Sequence number": 5285468, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1217 + } + }, + { + "ph": "f", "id": 132, "pid": 4183441, "tid": 31362, "ts": 676007927902.817, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007927903.999, "dur": 4.258, + "args": { + "External id": 447683,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007927906.782, "dur": 1.379, + "args": { + "External id": 447684,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927914.295, "dur": 102.576, + "args": { + "External id": 447685,"Record function id": 0, "Sequence number": 5285467, "Fwd thread id": 1, "Ev Idx": 1220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007927915.524, "dur": 91.912, + "args": { + "External id": 447686,"Sequence number": 5285467, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1221 + } + }, + { + "ph": "f", "id": 133, "pid": 4183441, "tid": 31362, "ts": 676007927915.524, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927919.710, "dur": 3.200, + "args": { + "External id": 447687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927920.243, "dur": 2.229, + "args": { + "External id": 447688,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927921.997, "dur": 0.381, + "args": { + "External id": 447689,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927923.673, "dur": 35.862, + "args": { + "External id": 447690,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927960.616, "dur": 7.246, + "args": { + "External id": 447691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927961.395, "dur": 5.792, + "args": { + "External id": 447692,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927964.778, "dur": 2.197, + "args": { + "External id": 447693,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007927969.121, "dur": 4.182, + "args": { + "External id": 447694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007927970.497, "dur": 2.391, + "args": { + "External id": 447695,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007927972.262, "dur": 0.552, + "args": { + "External id": 447696,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007927973.867, "dur": 32.837, + "args": { + "External id": 447697,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928021.151, "dur": 26.312, + "args": { + "External id": 447698,"Record function id": 0, "Sequence number": 5285466, "Fwd thread id": 1, "Ev Idx": 1233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928022.251, "dur": 5.974, + "args": { + "External id": 447699,"Sequence number": 5285466, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1234 + } + }, + { + "ph": "f", "id": 134, "pid": 4183441, "tid": 31362, "ts": 676007928022.251, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928023.985, "dur": 4.089, + "args": { + "External id": 447700,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928026.658, "dur": 1.285, + "args": { + "External id": 447701,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007928030.540, "dur": 14.712, + "args": { + "External id": 447702,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928050.798, "dur": 7.896, + "args": { + "External id": 447703,"Record function id": 0, "Sequence number": 5285465, "Fwd thread id": 1, "Ev Idx": 1238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928051.890, "dur": 5.137, + "args": { + "External id": 447704,"Sequence number": 5285465, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1239 + } + }, + { + "ph": "f", "id": 135, "pid": 4183441, "tid": 31362, "ts": 676007928051.890, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928053.131, "dur": 3.676, + "args": { + "External id": 447705,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928053.712, "dur": 2.526, + "args": { + "External id": 447706,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928055.660, "dur": 0.456, + "args": { + "External id": 447707,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928062.864, "dur": 5.473, + "args": { + "External id": 447708,"Record function id": 0, "Ev Idx": 1243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928064.925, "dur": 2.950, + "args": { + "External id": 447709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007928065.816, "dur": 1.752, + "args": { + "External id": 447710,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007928066.475, "dur": 0.993, + "args": { + "External id": 447711,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007928074.635, "dur": 363.977, + "args": { + "External id": 447712,"Record function id": 0, "Sequence number": 5285464, "Fwd thread id": 1, "Ev Idx": 1247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007928076.278, "dur": 333.436, + "args": { + "External id": 447713,"Sequence number": 5285464, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1248 + } + }, + { + "ph": "f", "id": 136, "pid": 4183441, "tid": 31362, "ts": 676007928076.278, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928129.672, "dur": 3.120, + "args": { + "External id": 447714,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928130.711, "dur": 1.842, + "args": { + "External id": 447715,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007928146.887, "dur": 6.407, + "args": { + "External id": 447716,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007928162.291, "dur": 2.939, + "args": { + "External id": 447717,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928310.639, "dur": 1.909, + "args": { + "External id": 447718,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007928316.591, "dur": 33.068, + "args": { + "External id": 447719,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928325.685, "dur": 1.021, + "args": { + "External id": 447720,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007928355.391, "dur": 30.266, + "args": { + "External id": 447721,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007928359.446, "dur": 25.961, + "args": { + "External id": 447722,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928363.815, "dur": 3.980, + "args": { + "External id": 447723,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007928369.222, "dur": 15.739, + "args": { + "External id": 447724,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007928390.083, "dur": 2.574, + "args": { + "External id": 447725,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928391.476, "dur": 1.087, + "args": { + "External id": 447726,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928398.475, "dur": 4.400, + "args": { + "External id": 447727,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928401.719, "dur": 1.065, + "args": { + "External id": 447728,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007928420.385, "dur": 14.752, + "args": { + "External id": 447729,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928450.081, "dur": 8.409, + "args": { + "External id": 447730,"Record function id": 0, "Ev Idx": 1265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928452.539, "dur": 5.287, + "args": { + "External id": 447731,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007928454.399, "dur": 2.438, + "args": { + "External id": 447732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007928455.271, "dur": 1.475, + "args": { + "External id": 447733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928462.464, "dur": 7.110, + "args": { + "External id": 447734,"Record function id": 0, "Sequence number": 5285463, "Fwd thread id": 1, "Ev Idx": 1269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928464.265, "dur": 1.362, + "args": { + "External id": 447735,"Sequence number": 5285463, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1270 + } + }, + { + "ph": "f", "id": 137, "pid": 4183441, "tid": 31362, "ts": 676007928464.265, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007928473.482, "dur": 429.251, + "args": { + "External id": 447736,"Record function id": 0, "Sequence number": 5285462, "Fwd thread id": 1, "Ev Idx": 1271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007928475.352, "dur": 414.865, + "args": { + "External id": 447737,"Sequence number": 5285462, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1272 + } + }, + { + "ph": "f", "id": 138, "pid": 4183441, "tid": 31362, "ts": 676007928475.352, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928506.400, "dur": 8.901, + "args": { + "External id": 447738,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007928512.136, "dur": 2.876, + "args": { + "External id": 447739,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]", "[4096, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[16777216, 4096, 1], [], []], "Input Dims": [[16, 4096, 1024], [], []], "Ev Idx": 1274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928518.157, "dur": 4.817, + "args": { + "External id": 447740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928519.629, "dur": 2.747, + "args": { + "External id": 447741,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928521.519, "dur": 0.657, + "args": { + "External id": 447742,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 31362, + "ts": 676007928526.520, "dur": 79.276, + "args": { + "External id": 447743,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4096, 1], [1, 2816], []], "Input Dims": [[65536, 1024], [2816, 1024], []], "Ev Idx": 1278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928529.275, "dur": 5.146, + "args": { + "External id": 447744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2816]], "Input Dims": [[2816, 1024]], "Ev Idx": 1279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928529.846, "dur": 4.126, + "args": { + "External id": 447745,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2816], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928531.318, "dur": 2.587, + "args": { + "External id": 447746,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[2816, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2816], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 31362, + "ts": 676007928535.743, "dur": 69.560, + "args": { + "External id": 447747,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 1282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007928537.023, "dur": 67.675, + "args": { + "External id": 447748,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4096, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 1283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007928609.245, "dur": 2.890, + "args": { + "External id": 447749,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [11534336, 2816, 1]], "Input Dims": [[65536, 2816], [16, 4096, 2816]], "Ev Idx": 1284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928610.827, "dur": 1.164, + "args": { + "External id": 447750,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 1285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007928642.635, "dur": 4.942, + "args": { + "External id": 447751,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007928648.940, "dur": 2.175, + "args": { + "External id": 447752,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007928652.085, "dur": 1.936, + "args": { + "External id": 447753,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928727.795, "dur": 3.102, + "args": { + "External id": 447754,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928728.617, "dur": 2.050, + "args": { + "External id": 447755,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 4183441, "tid": 31362, + "ts": 676007928753.470, "dur": 117.979, + "args": { + "External id": 447756,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[4096, 1], [2816, 1]], []], "Input Dims": [[], [[65536, 1024], [65536, 2816]], []], "Ev Idx": 1291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007928758.408, "dur": 8.095, + "args": { + "External id": 447757,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928763.031, "dur": 2.648, + "args": { + "External id": 447758,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024, 1]", "[4096, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007928768.457, "dur": 6.918, + "args": { + "External id": 447759,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4096, 1, 1], []], "Input Dims": [[65536, 1024, 1], []], "Ev Idx": 1294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928771.813, "dur": 2.659, + "args": { + "External id": 447760,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 65536]", "[1, 1, 4096]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 1], [], [], []], "Input Dims": [[65536, 1024, 1], [], [], []], "Ev Idx": 1295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 31362, + "ts": 676007928776.741, "dur": 2.988, + "args": { + "External id": 447761,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 1296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928778.656, "dur": 0.717, + "args": { + "External id": 447762,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007928780.845, "dur": 3.082, + "args": { + "External id": 447763,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928782.703, "dur": 0.613, + "args": { + "External id": 447764,"Record function id": 0, "Concrete Inputs": ["", "[1, 2816, 65536]", "[1, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1, 1], [], [], []], "Input Dims": [[65536, 2816, 1], [], [], []], "Ev Idx": 1299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007928787.904, "dur": 3.470, + "args": { + "External id": 447765,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 4096], []], "Input Dims": [[1024, 1, 65536], []], "Ev Idx": 1300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928790.396, "dur": 0.668, + "args": { + "External id": 447766,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536, 1]", "[1, 4096, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 4096], [], [], []], "Input Dims": [[1024, 1, 65536], [], [], []], "Ev Idx": 1301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928792.564, "dur": 6.608, + "args": { + "External id": 447767,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 4096, 1], []], "Input Dims": [[1024, 65536, 1], []], "Ev Idx": 1302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 4183441, "tid": 31362, + "ts": 676007928796.601, "dur": 2.400, + "args": { + "External id": 447768,"Record function id": 0, "Concrete Inputs": ["", "[1, 1024, 65536]", "[1024, 1, 4096]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 4096, 1], [], []], "Input Dims": [[1024, 65536, 1], [], []], "Ev Idx": 1303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007928802.065, "dur": 2.941, + "args": { + "External id": 447769,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 2816], []], "Input Dims": [[1, 2816, 65536], []], "Ev Idx": 1304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928804.179, "dur": 0.500, + "args": { + "External id": 447770,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816, 1]", "[2816, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 2816], [], [], []], "Input Dims": [[1, 2816, 65536], [], [], []], "Ev Idx": 1305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928805.861, "dur": 4.118, + "args": { + "External id": 447771,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928806.755, "dur": 3.117, + "args": { + "External id": 447772,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 1], []], "Input Dims": [[65536, 2816, 1], []], "Ev Idx": 1307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007928811.187, "dur": 46.509, + "args": { + "External id": 447773,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1, 4096], [184549376, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816]], "Ev Idx": 1308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928859.696, "dur": 3.173, + "args": { + "External id": 447774,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2883584, 2816, 1], []], "Input Dims": [[1, 1024, 2816], []], "Ev Idx": 1309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 4183441, "tid": 31362, + "ts": 676007928863.844, "dur": 3.332, + "args": { + "External id": 447775,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 2816, 1], []], "Input Dims": [[1024, 1, 2816], []], "Ev Idx": 1310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928866.129, "dur": 0.471, + "args": { + "External id": 447776,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816, 1]", "[2816, 1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 2816, 1], [], [], []], "Input Dims": [[1024, 1, 2816], [], [], []], "Ev Idx": 1311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928869.372, "dur": 1.130, + "args": { + "External id": 447777,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1, 2816], []], "Input Dims": [[1024, 2816, 1], []], "Ev Idx": 1312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928913.694, "dur": 9.249, + "args": { + "External id": 447778,"Record function id": 0, "Ev Idx": 1313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007928916.391, "dur": 5.895, + "args": { + "External id": 447779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007928918.481, "dur": 2.863, + "args": { + "External id": 447780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007928919.421, "dur": 1.830, + "args": { + "External id": 447781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928926.405, "dur": 8.308, + "args": { + "External id": 447782,"Record function id": 0, "Sequence number": 5285461, "Fwd thread id": 1, "Ev Idx": 1317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928927.967, "dur": 4.213, + "args": { + "External id": 447783,"Sequence number": 5285461, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1318 + } + }, + { + "ph": "f", "id": 139, "pid": 4183441, "tid": 31362, "ts": 676007928927.967, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007928930.289, "dur": 1.617, + "args": { + "External id": 447784,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007928931.067, "dur": 0.707, + "args": { + "External id": 447785,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928938.005, "dur": 109.416, + "args": { + "External id": 447786,"Record function id": 0, "Sequence number": 5285460, "Fwd thread id": 1, "Ev Idx": 1321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007928938.811, "dur": 101.723, + "args": { + "External id": 447787,"Sequence number": 5285460, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1322 + } + }, + { + "ph": "f", "id": 140, "pid": 4183441, "tid": 31362, "ts": 676007928938.811, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928945.187, "dur": 5.059, + "args": { + "External id": 447788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928946.818, "dur": 2.871, + "args": { + "External id": 447789,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928948.960, "dur": 0.580, + "args": { + "External id": 447790,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007928951.304, "dur": 33.640, + "args": { + "External id": 447791,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928985.987, "dur": 5.974, + "args": { + "External id": 447792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928986.934, "dur": 4.243, + "args": { + "External id": 447793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928989.842, "dur": 1.153, + "args": { + "External id": 447794,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007928993.781, "dur": 4.507, + "args": { + "External id": 447795,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007928995.353, "dur": 2.334, + "args": { + "External id": 447796,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007928997.014, "dur": 0.594, + "args": { + "External id": 447797,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007928998.926, "dur": 40.755, + "args": { + "External id": 447798,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929051.954, "dur": 8.698, + "args": { + "External id": 447799,"Record function id": 0, "Sequence number": 5285459, "Fwd thread id": 1, "Ev Idx": 1334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929052.886, "dur": 5.956, + "args": { + "External id": 447800,"Sequence number": 5285459, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1335 + } + }, + { + "ph": "f", "id": 141, "pid": 4183441, "tid": 31362, "ts": 676007929052.886, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929054.636, "dur": 4.064, + "args": { + "External id": 447801,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929057.315, "dur": 1.276, + "args": { + "External id": 447802,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929063.952, "dur": 7.713, + "args": { + "External id": 447803,"Record function id": 0, "Sequence number": 5285458, "Fwd thread id": 1, "Ev Idx": 1338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929064.765, "dur": 4.907, + "args": { + "External id": 447804,"Sequence number": 5285458, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1339 + } + }, + { + "ph": "f", "id": 142, "pid": 4183441, "tid": 31362, "ts": 676007929064.765, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929065.685, "dur": 3.773, + "args": { + "External id": 447805,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929066.260, "dur": 2.725, + "args": { + "External id": 447806,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929068.011, "dur": 0.884, + "args": { + "External id": 447807,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929075.327, "dur": 5.424, + "args": { + "External id": 447808,"Record function id": 0, "Ev Idx": 1343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929076.732, "dur": 3.500, + "args": { + "External id": 447809,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007929077.977, "dur": 2.007, + "args": { + "External id": 447810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007929078.751, "dur": 1.148, + "args": { + "External id": 447811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929100.861, "dur": 10.252, + "args": { + "External id": 447812,"Record function id": 0, "Sequence number": 5285457, "Fwd thread id": 1, "Ev Idx": 1347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929102.854, "dur": 5.906, + "args": { + "External id": 447813,"Sequence number": 5285457, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[11534336, 2816, 1]], "Input Dims": [[16, 4096, 2816]], "Ev Idx": 1348 + } + }, + { + "ph": "f", "id": 143, "pid": 4183441, "tid": 31362, "ts": 676007929102.854, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929106.455, "dur": 2.144, + "args": { + "External id": 447814,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929107.119, "dur": 1.304, + "args": { + "External id": 447815,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 1350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929114.203, "dur": 97.680, + "args": { + "External id": 447816,"Record function id": 0, "Sequence number": 5285456, "Fwd thread id": 1, "Ev Idx": 1351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929115.309, "dur": 87.530, + "args": { + "External id": 447817,"Sequence number": 5285456, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1352 + } + }, + { + "ph": "f", "id": 144, "pid": 4183441, "tid": 31362, "ts": 676007929115.309, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929119.094, "dur": 4.620, + "args": { + "External id": 447818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[65536, 2816]], "Ev Idx": 1353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929119.763, "dur": 3.513, + "args": { + "External id": 447819,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[65536, 2816], [], []], "Ev Idx": 1354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929122.589, "dur": 0.550, + "args": { + "External id": 447820,"Record function id": 0, "Concrete Inputs": ["", "[2816, 65536]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[65536, 2816], [], [], []], "Ev Idx": 1355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007929124.415, "dur": 31.150, + "args": { + "External id": 447821,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024]], "Ev Idx": 1356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929156.373, "dur": 4.145, + "args": { + "External id": 447822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929156.959, "dur": 2.997, + "args": { + "External id": 447823,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 1358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929158.585, "dur": 1.204, + "args": { + "External id": 447824,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 1359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929161.869, "dur": 6.894, + "args": { + "External id": 447825,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929163.658, "dur": 4.714, + "args": { + "External id": 447826,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929166.622, "dur": 1.665, + "args": { + "External id": 447827,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007929169.465, "dur": 32.647, + "args": { + "External id": 447828,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 1363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929217.474, "dur": 30.998, + "args": { + "External id": 447829,"Record function id": 0, "Sequence number": 5285455, "Fwd thread id": 1, "Ev Idx": 1364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929218.371, "dur": 4.883, + "args": { + "External id": 447830,"Sequence number": 5285455, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1365 + } + }, + { + "ph": "f", "id": 145, "pid": 4183441, "tid": 31362, "ts": 676007929218.371, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929220.325, "dur": 2.788, + "args": { + "External id": 447831,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929221.569, "dur": 1.416, + "args": { + "External id": 447832,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007929225.847, "dur": 19.581, + "args": { + "External id": 447833,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929251.971, "dur": 10.275, + "args": { + "External id": 447834,"Record function id": 0, "Sequence number": 5285454, "Fwd thread id": 1, "Ev Idx": 1369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929253.013, "dur": 6.795, + "args": { + "External id": 447835,"Sequence number": 5285454, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1370 + } + }, + { + "ph": "f", "id": 146, "pid": 4183441, "tid": 31362, "ts": 676007929253.013, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929254.235, "dur": 5.340, + "args": { + "External id": 447836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 2816]], "Ev Idx": 1371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929255.191, "dur": 3.840, + "args": { + "External id": 447837,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 1372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929258.146, "dur": 0.794, + "args": { + "External id": 447838,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 1373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929266.278, "dur": 6.314, + "args": { + "External id": 447839,"Record function id": 0, "Ev Idx": 1374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929268.602, "dur": 3.534, + "args": { + "External id": 447840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007929269.753, "dur": 1.926, + "args": { + "External id": 447841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007929270.445, "dur": 1.146, + "args": { + "External id": 447842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007929276.646, "dur": 444.457, + "args": { + "External id": 447843,"Record function id": 0, "Sequence number": 5285453, "Fwd thread id": 1, "Ev Idx": 1378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007929282.027, "dur": 360.385, + "args": { + "External id": 447844,"Sequence number": 5285453, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 1379 + } + }, + { + "ph": "f", "id": 147, "pid": 4183441, "tid": 31362, "ts": 676007929282.027, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 31362, + "ts": 676007929304.369, "dur": 33.181, + "args": { + "External id": 447845,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007929305.888, "dur": 31.474, + "args": { + "External id": 447846,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007929308.914, "dur": 5.914, + "args": { + "External id": 447847,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], [], []], "Ev Idx": 1382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007929311.431, "dur": 2.919, + "args": { + "External id": 447848,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007929316.157, "dur": 20.654, + "args": { + "External id": 447849,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929350.630, "dur": 2.285, + "args": { + "External id": 447850,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929351.535, "dur": 1.240, + "args": { + "External id": 447851,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929356.821, "dur": 3.358, + "args": { + "External id": 447852,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929357.586, "dur": 2.507, + "args": { + "External id": 447853,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007929372.471, "dur": 2.692, + "args": { + "External id": 447854,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007929385.648, "dur": 4.322, + "args": { + "External id": 447855,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929538.577, "dur": 3.677, + "args": { + "External id": 447856,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007929546.372, "dur": 30.094, + "args": { + "External id": 447857,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929553.949, "dur": 0.936, + "args": { + "External id": 447858,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007929582.037, "dur": 29.472, + "args": { + "External id": 447859,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007929583.735, "dur": 27.562, + "args": { + "External id": 447860,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929587.748, "dur": 3.804, + "args": { + "External id": 447861,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007929594.696, "dur": 15.988, + "args": { + "External id": 447862,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007929615.343, "dur": 2.769, + "args": { + "External id": 447863,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929616.677, "dur": 1.296, + "args": { + "External id": 447864,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929624.234, "dur": 2.675, + "args": { + "External id": 447865,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929625.486, "dur": 1.327, + "args": { + "External id": 447866,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929629.570, "dur": 3.939, + "args": { + "External id": 447867,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929630.833, "dur": 2.579, + "args": { + "External id": 447868,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007929698.952, "dur": 19.982, + "args": { + "External id": 447869,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929733.847, "dur": 9.932, + "args": { + "External id": 447870,"Record function id": 0, "Ev Idx": 1405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929736.569, "dur": 6.514, + "args": { + "External id": 447871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007929738.743, "dur": 3.202, + "args": { + "External id": 447872,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007929739.554, "dur": 2.266, + "args": { + "External id": 447873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929747.307, "dur": 8.844, + "args": { + "External id": 447874,"Record function id": 0, "Sequence number": 5285452, "Fwd thread id": 1, "Ev Idx": 1409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929748.584, "dur": 4.531, + "args": { + "External id": 447875,"Sequence number": 5285452, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1410 + } + }, + { + "ph": "f", "id": 148, "pid": 4183441, "tid": 31362, "ts": 676007929748.584, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929750.229, "dur": 2.665, + "args": { + "External id": 447876,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929751.169, "dur": 1.595, + "args": { + "External id": 447877,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929761.243, "dur": 134.014, + "args": { + "External id": 447878,"Record function id": 0, "Sequence number": 5285451, "Fwd thread id": 1, "Ev Idx": 1413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929762.443, "dur": 126.015, + "args": { + "External id": 447879,"Sequence number": 5285451, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1414 + } + }, + { + "ph": "f", "id": 149, "pid": 4183441, "tid": 31362, "ts": 676007929762.443, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929766.688, "dur": 5.323, + "args": { + "External id": 447880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929768.411, "dur": 2.940, + "args": { + "External id": 447881,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929770.311, "dur": 0.855, + "args": { + "External id": 447882,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007929773.099, "dur": 65.607, + "args": { + "External id": 447883,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929839.856, "dur": 7.206, + "args": { + "External id": 447884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929842.333, "dur": 3.962, + "args": { + "External id": 447885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929844.030, "dur": 2.058, + "args": { + "External id": 447886,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929848.448, "dur": 3.863, + "args": { + "External id": 447887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929849.846, "dur": 1.987, + "args": { + "External id": 447888,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929851.244, "dur": 0.495, + "args": { + "External id": 447889,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007929852.961, "dur": 34.763, + "args": { + "External id": 447890,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929900.086, "dur": 12.014, + "args": { + "External id": 447891,"Record function id": 0, "Sequence number": 5285450, "Fwd thread id": 1, "Ev Idx": 1426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929901.213, "dur": 8.067, + "args": { + "External id": 447892,"Sequence number": 5285450, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1427 + } + }, + { + "ph": "f", "id": 150, "pid": 4183441, "tid": 31362, "ts": 676007929901.213, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929904.732, "dur": 4.376, + "args": { + "External id": 447893,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929905.821, "dur": 3.152, + "args": { + "External id": 447894,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929915.430, "dur": 8.085, + "args": { + "External id": 447895,"Record function id": 0, "Sequence number": 5285449, "Fwd thread id": 1, "Ev Idx": 1430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929916.806, "dur": 4.343, + "args": { + "External id": 447896,"Sequence number": 5285449, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1431 + } + }, + { + "ph": "f", "id": 151, "pid": 4183441, "tid": 31362, "ts": 676007929916.806, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007929917.489, "dur": 3.465, + "args": { + "External id": 447897,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007929918.230, "dur": 2.223, + "args": { + "External id": 447898,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929919.810, "dur": 0.470, + "args": { + "External id": 447899,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929927.282, "dur": 7.356, + "args": { + "External id": 447900,"Record function id": 0, "Ev Idx": 1435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007929929.188, "dur": 4.962, + "args": { + "External id": 447901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007929930.138, "dur": 3.798, + "args": { + "External id": 447902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007929932.656, "dur": 1.174, + "args": { + "External id": 447903,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929937.482, "dur": 7.215, + "args": { + "External id": 447904,"Record function id": 0, "Sequence number": 5285448, "Fwd thread id": 1, "Ev Idx": 1439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007929938.541, "dur": 3.632, + "args": { + "External id": 447905,"Sequence number": 5285448, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1440 + } + }, + { + "ph": "f", "id": 152, "pid": 4183441, "tid": 31362, "ts": 676007929938.541, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007929939.983, "dur": 2.045, + "args": { + "External id": 447906,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007929940.767, "dur": 1.114, + "args": { + "External id": 447907,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007929948.808, "dur": 307.807, + "args": { + "External id": 447908,"Record function id": 0, "Sequence number": 5285447, "Fwd thread id": 1, "Ev Idx": 1443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 4183441, "tid": 31362, + "ts": 676007929950.421, "dur": 283.563, + "args": { + "External id": 447909,"Sequence number": 5285447, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1444 + } + }, + { + "ph": "f", "id": 153, "pid": 4183441, "tid": 31362, "ts": 676007929950.421, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007929966.482, "dur": 7.705, + "args": { + "External id": 447910,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929969.490, "dur": 4.284, + "args": { + "External id": 447911,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007929976.427, "dur": 3.325, + "args": { + "External id": 447912,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929977.773, "dur": 1.799, + "args": { + "External id": 447913,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007929981.359, "dur": 3.209, + "args": { + "External id": 447914,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007929982.972, "dur": 1.421, + "args": { + "External id": 447915,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007930008.714, "dur": 199.678, + "args": { + "External id": 447916,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007930107.721, "dur": 6.055, + "args": { + "External id": 447917,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007930115.955, "dur": 3.745, + "args": { + "External id": 447918,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007930221.185, "dur": 3.512, + "args": { + "External id": 447919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007930227.521, "dur": 0.896, + "args": { + "External id": 447920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 31362, + "ts": 676007930230.201, "dur": 0.824, + "args": { + "External id": 447921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007930266.022, "dur": 227.157, + "args": { + "External id": 447922,"Record function id": 0, "Sequence number": 5285446, "Fwd thread id": 1, "Ev Idx": 1457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007930267.590, "dur": 218.394, + "args": { + "External id": 447923,"Sequence number": 5285446, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1458 + } + }, + { + "ph": "f", "id": 154, "pid": 4183441, "tid": 31362, "ts": 676007930267.590, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007930287.310, "dur": 47.886, + "args": { + "External id": 447924,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930290.643, "dur": 3.193, + "args": { + "External id": 447925,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007930295.182, "dur": 39.379, + "args": { + "External id": 447926,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007930345.119, "dur": 4.558, + "args": { + "External id": 447927,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930347.238, "dur": 2.109, + "args": { + "External id": 447928,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007930499.762, "dur": 142.490, + "args": { + "External id": 447929,"Record function id": 0, "Sequence number": 5285445, "Fwd thread id": 1, "Ev Idx": 1464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007930501.949, "dur": 134.559, + "args": { + "External id": 447930,"Sequence number": 5285445, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1465 + } + }, + { + "ph": "f", "id": 155, "pid": 4183441, "tid": 31362, "ts": 676007930501.949, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 31362, + "ts": 676007930513.163, "dur": 31.501, + "args": { + "External id": 447931,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930515.493, "dur": 2.324, + "args": { + "External id": 447932,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007930518.862, "dur": 25.399, + "args": { + "External id": 447933,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], []], "Ev Idx": 1468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 31362, + "ts": 676007930551.489, "dur": 4.114, + "args": { + "External id": 447934,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 1469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930553.212, "dur": 2.091, + "args": { + "External id": 447935,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930648.209, "dur": 55.728, + "args": { + "External id": 447936,"Record function id": 0, "Sequence number": 5285444, "Fwd thread id": 1, "Ev Idx": 1471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930649.767, "dur": 49.317, + "args": { + "External id": 447937,"Sequence number": 5285444, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1472 + } + }, + { + "ph": "f", "id": 156, "pid": 4183441, "tid": 31362, "ts": 676007930649.767, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930653.925, "dur": 44.859, + "args": { + "External id": 447938,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930692.161, "dur": 6.296, + "args": { + "External id": 447939,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930709.471, "dur": 8.199, + "args": { + "External id": 447940,"Record function id": 0, "Sequence number": 5285443, "Fwd thread id": 1, "Ev Idx": 1475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930710.870, "dur": 4.179, + "args": { + "External id": 447941,"Sequence number": 5285443, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1476 + } + }, + { + "ph": "f", "id": 157, "pid": 4183441, "tid": 31362, "ts": 676007930710.870, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930712.851, "dur": 2.058, + "args": { + "External id": 447942,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930713.862, "dur": 0.935, + "args": { + "External id": 447943,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930720.929, "dur": 7.223, + "args": { + "External id": 447944,"Record function id": 0, "Sequence number": 5285442, "Fwd thread id": 1, "Ev Idx": 1479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930721.781, "dur": 4.275, + "args": { + "External id": 447945,"Sequence number": 5285442, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 1480 + } + }, + { + "ph": "f", "id": 158, "pid": 4183441, "tid": 31362, "ts": 676007930721.781, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930723.321, "dur": 2.584, + "args": { + "External id": 447946,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930724.475, "dur": 1.310, + "args": { + "External id": 447947,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 1482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930731.384, "dur": 9.213, + "args": { + "External id": 447948,"Record function id": 0, "Sequence number": 5285441, "Fwd thread id": 1, "Ev Idx": 1483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930732.935, "dur": 5.287, + "args": { + "External id": 447949,"Sequence number": 5285441, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1484 + } + }, + { + "ph": "f", "id": 159, "pid": 4183441, "tid": 31362, "ts": 676007930732.935, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930736.215, "dur": 1.866, + "args": { + "External id": 447950,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930736.926, "dur": 1.058, + "args": { + "External id": 447951,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930744.037, "dur": 154.535, + "args": { + "External id": 447952,"Record function id": 0, "Sequence number": 5285440, "Fwd thread id": 1, "Ev Idx": 1487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930744.907, "dur": 146.420, + "args": { + "External id": 447953,"Sequence number": 5285440, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1488 + } + }, + { + "ph": "f", "id": 160, "pid": 4183441, "tid": 31362, "ts": 676007930744.907, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930748.914, "dur": 7.965, + "args": { + "External id": 447954,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930750.577, "dur": 5.660, + "args": { + "External id": 447955,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930754.258, "dur": 1.670, + "args": { + "External id": 447956,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007930758.218, "dur": 79.333, + "args": { + "External id": 447957,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930838.786, "dur": 4.962, + "args": { + "External id": 447958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930839.869, "dur": 3.027, + "args": { + "External id": 447959,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930841.682, "dur": 1.001, + "args": { + "External id": 447960,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930845.334, "dur": 5.718, + "args": { + "External id": 447961,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930846.890, "dur": 3.498, + "args": { + "External id": 447962,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930849.948, "dur": 0.374, + "args": { + "External id": 447963,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007930851.953, "dur": 38.579, + "args": { + "External id": 447964,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930903.136, "dur": 7.430, + "args": { + "External id": 447965,"Record function id": 0, "Sequence number": 5285439, "Fwd thread id": 1, "Ev Idx": 1500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930904.443, "dur": 4.082, + "args": { + "External id": 447966,"Sequence number": 5285439, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1501 + } + }, + { + "ph": "f", "id": 161, "pid": 4183441, "tid": 31362, "ts": 676007930904.443, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930906.098, "dur": 2.283, + "args": { + "External id": 447967,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930907.334, "dur": 0.948, + "args": { + "External id": 447968,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930913.780, "dur": 9.731, + "args": { + "External id": 447969,"Record function id": 0, "Sequence number": 5285438, "Fwd thread id": 1, "Ev Idx": 1504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930914.705, "dur": 6.780, + "args": { + "External id": 447970,"Sequence number": 5285438, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1505 + } + }, + { + "ph": "f", "id": 162, "pid": 4183441, "tid": 31362, "ts": 676007930914.705, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930915.790, "dur": 5.484, + "args": { + "External id": 447971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930918.441, "dur": 2.178, + "args": { + "External id": 447972,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930920.045, "dur": 0.490, + "args": { + "External id": 447973,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007930929.267, "dur": 9.100, + "args": { + "External id": 447974,"Record function id": 0, "Ev Idx": 1509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007930931.331, "dur": 6.382, + "args": { + "External id": 447975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007930933.903, "dur": 3.382, + "args": { + "External id": 447976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007930934.893, "dur": 2.298, + "args": { + "External id": 447977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930941.794, "dur": 6.173, + "args": { + "External id": 447978,"Record function id": 0, "Sequence number": 5285437, "Fwd thread id": 1, "Ev Idx": 1513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930943.902, "dur": 2.582, + "args": { + "External id": 447979,"Sequence number": 5285437, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1514 + } + }, + { + "ph": "f", "id": 163, "pid": 4183441, "tid": 31362, "ts": 676007930943.902, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007930944.839, "dur": 1.484, + "args": { + "External id": 447980,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007930945.568, "dur": 0.661, + "args": { + "External id": 447981,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930952.705, "dur": 97.630, + "args": { + "External id": 447982,"Record function id": 0, "Sequence number": 5285436, "Fwd thread id": 1, "Ev Idx": 1517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007930953.559, "dur": 90.196, + "args": { + "External id": 447983,"Sequence number": 5285436, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1518 + } + }, + { + "ph": "f", "id": 164, "pid": 4183441, "tid": 31362, "ts": 676007930953.559, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930956.856, "dur": 2.805, + "args": { + "External id": 447984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930957.349, "dur": 1.856, + "args": { + "External id": 447985,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930958.632, "dur": 0.469, + "args": { + "External id": 447986,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007930960.182, "dur": 33.887, + "args": { + "External id": 447987,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007930995.101, "dur": 5.928, + "args": { + "External id": 447988,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007930995.998, "dur": 4.479, + "args": { + "External id": 447989,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007930999.294, "dur": 1.077, + "args": { + "External id": 447990,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931002.198, "dur": 6.708, + "args": { + "External id": 447991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931003.854, "dur": 4.132, + "args": { + "External id": 447992,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931005.429, "dur": 2.451, + "args": { + "External id": 447993,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007931009.475, "dur": 33.411, + "args": { + "External id": 447994,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931056.289, "dur": 55.681, + "args": { + "External id": 447995,"Record function id": 0, "Sequence number": 5285435, "Fwd thread id": 1, "Ev Idx": 1530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931057.693, "dur": 8.590, + "args": { + "External id": 447996,"Sequence number": 5285435, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1531 + } + }, + { + "ph": "f", "id": 165, "pid": 4183441, "tid": 31362, "ts": 676007931057.693, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007931060.897, "dur": 5.240, + "args": { + "External id": 447997,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931064.811, "dur": 1.189, + "args": { + "External id": 447998,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 31362, + "ts": 676007931069.623, "dur": 38.961, + "args": { + "External id": 447999,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931117.647, "dur": 26.559, + "args": { + "External id": 448000,"Record function id": 0, "Sequence number": 5285434, "Fwd thread id": 1, "Ev Idx": 1535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931134.753, "dur": 7.019, + "args": { + "External id": 448001,"Sequence number": 5285434, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1536 + } + }, + { + "ph": "f", "id": 166, "pid": 4183441, "tid": 31362, "ts": 676007931134.753, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931135.754, "dur": 5.784, + "args": { + "External id": 448002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931136.621, "dur": 4.175, + "args": { + "External id": 448003,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931140.159, "dur": 0.516, + "args": { + "External id": 448004,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931148.444, "dur": 6.034, + "args": { + "External id": 448005,"Record function id": 0, "Ev Idx": 1540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931149.939, "dur": 3.968, + "args": { + "External id": 448006,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007931151.432, "dur": 2.139, + "args": { + "External id": 448007,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007931151.910, "dur": 1.557, + "args": { + "External id": 448008,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931157.553, "dur": 6.955, + "args": { + "External id": 448009,"Record function id": 0, "Sequence number": 5285433, "Fwd thread id": 1, "Ev Idx": 1544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931158.951, "dur": 3.788, + "args": { + "External id": 448010,"Sequence number": 5285433, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1545 + } + }, + { + "ph": "f", "id": 167, "pid": 4183441, "tid": 31362, "ts": 676007931158.951, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007931160.631, "dur": 1.965, + "args": { + "External id": 448011,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931161.579, "dur": 0.889, + "args": { + "External id": 448012,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931167.716, "dur": 101.618, + "args": { + "External id": 448013,"Record function id": 0, "Sequence number": 5285432, "Fwd thread id": 1, "Ev Idx": 1548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931168.618, "dur": 92.223, + "args": { + "External id": 448014,"Sequence number": 5285432, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1549 + } + }, + { + "ph": "f", "id": 168, "pid": 4183441, "tid": 31362, "ts": 676007931168.618, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931173.654, "dur": 2.722, + "args": { + "External id": 448015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931174.058, "dur": 1.859, + "args": { + "External id": 448016,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[65536, 1024], [], []], "Ev Idx": 1551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931175.341, "dur": 0.479, + "args": { + "External id": 448017,"Record function id": 0, "Concrete Inputs": ["", "[1024, 65536]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 1552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007931177.183, "dur": 40.584, + "args": { + "External id": 448018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024]], "Ev Idx": 1553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931218.674, "dur": 5.036, + "args": { + "External id": 448019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931219.214, "dur": 3.921, + "args": { + "External id": 448020,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931222.574, "dur": 0.448, + "args": { + "External id": 448021,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931225.046, "dur": 3.441, + "args": { + "External id": 448022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931226.352, "dur": 1.698, + "args": { + "External id": 448023,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931227.616, "dur": 0.345, + "args": { + "External id": 448024,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007931228.943, "dur": 31.189, + "args": { + "External id": 448025,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 1560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931273.416, "dur": 24.972, + "args": { + "External id": 448026,"Record function id": 0, "Sequence number": 5285431, "Fwd thread id": 1, "Ev Idx": 1561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931274.231, "dur": 3.966, + "args": { + "External id": 448027,"Sequence number": 5285431, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 1562 + } + }, + { + "ph": "f", "id": 169, "pid": 4183441, "tid": 31362, "ts": 676007931274.231, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007931275.982, "dur": 2.058, + "args": { + "External id": 448028,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931276.851, "dur": 1.052, + "args": { + "External id": 448029,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007931280.531, "dur": 15.450, + "args": { + "External id": 448030,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931301.681, "dur": 9.746, + "args": { + "External id": 448031,"Record function id": 0, "Sequence number": 5285430, "Fwd thread id": 1, "Ev Idx": 1566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 4183441, "tid": 31362, + "ts": 676007931304.853, "dur": 4.654, + "args": { + "External id": 448032,"Sequence number": 5285430, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1567 + } + }, + { + "ph": "f", "id": 170, "pid": 4183441, "tid": 31362, "ts": 676007931304.853, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 31362, + "ts": 676007931305.480, "dur": 3.804, + "args": { + "External id": 448033,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 1024]], "Input Dims": [[1024, 1024]], "Ev Idx": 1568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 31362, + "ts": 676007931306.245, "dur": 2.494, + "args": { + "External id": 448034,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 1024], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 1569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931308.044, "dur": 0.609, + "args": { + "External id": 448035,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1024, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1024], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 1570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931315.231, "dur": 4.951, + "args": { + "External id": 448036,"Record function id": 0, "Ev Idx": 1571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931316.937, "dur": 2.796, + "args": { + "External id": 448037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007931318.033, "dur": 1.458, + "args": { + "External id": 448038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007931318.355, "dur": 1.039, + "args": { + "External id": 448039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007931324.461, "dur": 378.557, + "args": { + "External id": 448040,"Record function id": 0, "Sequence number": 5285429, "Fwd thread id": 1, "Ev Idx": 1575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007931325.862, "dur": 301.008, + "args": { + "External id": 448041,"Sequence number": 5285429, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1576 + } + }, + { + "ph": "f", "id": 171, "pid": 4183441, "tid": 31362, "ts": 676007931325.862, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007931357.708, "dur": 3.395, + "args": { + "External id": 448042,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931359.922, "dur": 1.015, + "args": { + "External id": 448043,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 1578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007931375.159, "dur": 5.455, + "args": { + "External id": 448044,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007931389.696, "dur": 2.847, + "args": { + "External id": 448045,"Record function id": 0, "Concrete Inputs": ["[132, 1024]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931531.967, "dur": 1.878, + "args": { + "External id": 448046,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 1024]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[132, 1024], []], "Ev Idx": 1581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 31362, + "ts": 676007931537.945, "dur": 32.542, + "args": { + "External id": 448047,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[135168, 1024, 1], [], [], []], "Input Dims": [[1, 132, 1024], [], [], []], "Ev Idx": 1582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931547.538, "dur": 0.861, + "args": { + "External id": 448048,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 1024]", "[1024, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1, 1024], [], [], []], "Ev Idx": 1583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007931576.141, "dur": 29.979, + "args": { + "External id": 448049,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], []], "Ev Idx": 1584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007931579.849, "dur": 26.044, + "args": { + "External id": 448050,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[1, 1024], [], [], [], [], [], []], "Ev Idx": 1585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931584.232, "dur": 3.668, + "args": { + "External id": 448051,"Record function id": 0, "Concrete Inputs": ["[1, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007931589.400, "dur": 15.981, + "args": { + "External id": 448052,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[1, 1024], [1, 1024], []], "Ev Idx": 1587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 31362, + "ts": 676007931610.460, "dur": 2.685, + "args": { + "External id": 448053,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1]], "Input Dims": [[1, 1024], [1024]], "Ev Idx": 1588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931611.874, "dur": 1.171, + "args": { + "External id": 448054,"Record function id": 0, "Concrete Inputs": ["", "[1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[1, 1024], []], "Ev Idx": 1589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 31362, + "ts": 676007931618.665, "dur": 1.927, + "args": { + "External id": 448055,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007931619.791, "dur": 0.715, + "args": { + "External id": 448056,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 1591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 31362, + "ts": 676007931643.145, "dur": 53.828, + "args": { + "External id": 448057,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 1592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931715.092, "dur": 8.994, + "args": { + "External id": 448058,"Record function id": 0, "Ev Idx": 1593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007931717.449, "dur": 5.918, + "args": { + "External id": 448059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007931719.694, "dur": 2.704, + "args": { + "External id": 448060,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007931720.519, "dur": 1.780, + "args": { + "External id": 448061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007931728.508, "dur": 2780.951, + "args": { + "External id": 448062,"Record function id": 0, "Ev Idx": 1597 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.19)", "pid": 4183441, "tid": 31362, + "ts": 676007931760.730, "dur": 1105.159, + "args": { + "External id": 448063,"Record function id": 0, "Ev Idx": 1598 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.18", "pid": 4183441, "tid": 31362, + "ts": 676007931787.159, "dur": 1070.471, + "args": { + "External id": 448064,"Record function id": 0, "Ev Idx": 1599 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007931802.369, "dur": 1038.438, + "args": { + "External id": 448065,"Record function id": 0, "Ev Idx": 1600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007931898.152, "dur": 8.808, + "args": { + "External id": 448066,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676007931923.047, "dur": 34.375, + "args": { + "External id": 448067,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931927.157, "dur": 1.327, + "args": { + "External id": 448068,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931930.387, "dur": 2.586, + "args": { + "External id": 448069,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931936.157, "dur": 0.347, + "args": { + "External id": 448070,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931937.851, "dur": 0.462, + "args": { + "External id": 448071,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931939.491, "dur": 0.344, + "args": { + "External id": 448072,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931943.168, "dur": 0.398, + "args": { + "External id": 448073,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931945.109, "dur": 0.478, + "args": { + "External id": 448074,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931947.097, "dur": 2.119, + "args": { + "External id": 448075,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007931950.916, "dur": 0.355, + "args": { + "External id": 448076,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676007931973.719, "dur": 34.158, + "args": { + "External id": 448077,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676007932052.521, "dur": 139.604, + "args": { + "External id": 448078,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007932063.739, "dur": 6.835, + "args": { + "External id": 448079,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676007932077.335, "dur": 31.393, + "args": { + "External id": 448080,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007932101.341, "dur": 6.973, + "args": { + "External id": 448081,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932105.692, "dur": 0.761, + "args": { + "External id": 448082,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676007932117.906, "dur": 29.584, + "args": { + "External id": 448083,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932120.317, "dur": 0.482, + "args": { + "External id": 448084,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932122.359, "dur": 1.710, + "args": { + "External id": 448085,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932125.582, "dur": 0.556, + "args": { + "External id": 448086,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932127.358, "dur": 0.328, + "args": { + "External id": 448087,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932131.087, "dur": 0.294, + "args": { + "External id": 448088,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932132.836, "dur": 0.471, + "args": { + "External id": 448089,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932134.575, "dur": 2.308, + "args": { + "External id": 448090,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932139.556, "dur": 0.487, + "args": { + "External id": 448091,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007932141.214, "dur": 0.514, + "args": { + "External id": 448092,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676007932158.698, "dur": 24.784, + "args": { + "External id": 448093,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676007932258.642, "dur": 467.210, + "args": { + "External id": 448094,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007932294.338, "dur": 425.247, + "args": { + "External id": 448095,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1630, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676007932306.340, "dur": 406.618, + "args": { + "External id": 448096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007932751.525, "dur": 3.115, + "args": { + "External id": 448097,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1632, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007932874.364, "dur": 1613.223, + "args": { + "External id": 448098,"Sequence number": 5285428, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1633 + } + }, + { + "ph": "f", "id": 172, "pid": 4183441, "tid": 31362, "ts": 676007932874.364, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933008.090, "dur": 124.578, + "args": { + "External id": 448099,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676007933178.228, "dur": 38.332, + "args": { + "External id": 448100,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007933237.638, "dur": 45.504, + "args": { + "External id": 448101,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933292.200, "dur": 28.393, + "args": { + "External id": 448102,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933326.430, "dur": 35.069, + "args": { + "External id": 448103,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933370.081, "dur": 23.487, + "args": { + "External id": 448104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933400.995, "dur": 28.581, + "args": { + "External id": 448105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676007933454.779, "dur": 24.002, + "args": { + "External id": 448106,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676007933499.611, "dur": 27.052, + "args": { + "External id": 448107,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676007933549.076, "dur": 18.215, + "args": { + "External id": 448108,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676007933582.779, "dur": 14.452, + "args": { + "External id": 448109,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933610.211, "dur": 36.514, + "args": { + "External id": 448110,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007933650.197, "dur": 68.249, + "args": { + "External id": 448111,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007933752.424, "dur": 170.203, + "args": { + "External id": 448112,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007933830.004, "dur": 5.418, + "args": { + "External id": 448113,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007933837.310, "dur": 5.922, + "args": { + "External id": 448114,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676007933961.067, "dur": 29.466, + "args": { + "External id": 448115,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676007934003.423, "dur": 13.547, + "args": { + "External id": 448116,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934026.688, "dur": 46.127, + "args": { + "External id": 448117,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934078.272, "dur": 49.989, + "args": { + "External id": 448118,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934138.075, "dur": 30.389, + "args": { + "External id": 448119,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934175.371, "dur": 28.703, + "args": { + "External id": 448120,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934209.549, "dur": 27.546, + "args": { + "External id": 448121,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007934244.187, "dur": 28.995, + "args": { + "External id": 448122,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676007934294.558, "dur": 22.543, + "args": { + "External id": 448123,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676007934339.020, "dur": 25.028, + "args": { + "External id": 448124,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676007934381.718, "dur": 15.634, + "args": { + "External id": 448125,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676007934413.779, "dur": 12.931, + "args": { + "External id": 448126,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676007934443.044, "dur": 15.913, + "args": { + "External id": 448127,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934530.410, "dur": 14.262, + "args": { + "External id": 448128,"Record function id": 0, "Ev Idx": 1663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934533.815, "dur": 10.088, + "args": { + "External id": 448129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934537.708, "dur": 5.422, + "args": { + "External id": 448130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934539.261, "dur": 3.777, + "args": { + "External id": 448131,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934548.571, "dur": 5.352, + "args": { + "External id": 448132,"Record function id": 0, "Ev Idx": 1667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934550.130, "dur": 3.341, + "args": { + "External id": 448133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934551.316, "dur": 1.680, + "args": { + "External id": 448134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934551.999, "dur": 0.902, + "args": { + "External id": 448135,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934557.091, "dur": 3.965, + "args": { + "External id": 448136,"Record function id": 0, "Ev Idx": 1671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934558.209, "dur": 2.444, + "args": { + "External id": 448137,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934558.856, "dur": 1.398, + "args": { + "External id": 448138,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934559.370, "dur": 0.818, + "args": { + "External id": 448139,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934564.245, "dur": 6.468, + "args": { + "External id": 448140,"Record function id": 0, "Ev Idx": 1675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934565.991, "dur": 4.300, + "args": { + "External id": 448141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934566.690, "dur": 2.932, + "args": { + "External id": 448142,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934567.245, "dur": 2.304, + "args": { + "External id": 448143,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934573.687, "dur": 3.704, + "args": { + "External id": 448144,"Record function id": 0, "Ev Idx": 1679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934574.741, "dur": 2.246, + "args": { + "External id": 448145,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934575.513, "dur": 1.059, + "args": { + "External id": 448146,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934575.776, "dur": 0.722, + "args": { + "External id": 448147,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934580.393, "dur": 5.868, + "args": { + "External id": 448148,"Record function id": 0, "Ev Idx": 1683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934581.866, "dur": 3.976, + "args": { + "External id": 448149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934582.423, "dur": 2.886, + "args": { + "External id": 448150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934584.616, "dur": 0.624, + "args": { + "External id": 448151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934589.368, "dur": 4.198, + "args": { + "External id": 448152,"Record function id": 0, "Ev Idx": 1687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934590.753, "dur": 2.398, + "args": { + "External id": 448153,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934591.367, "dur": 1.341, + "args": { + "External id": 448154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934591.829, "dur": 0.815, + "args": { + "External id": 448155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934596.590, "dur": 3.945, + "args": { + "External id": 448156,"Record function id": 0, "Ev Idx": 1691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934597.725, "dur": 2.388, + "args": { + "External id": 448157,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934598.273, "dur": 1.284, + "args": { + "External id": 448158,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934598.653, "dur": 0.838, + "args": { + "External id": 448159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934605.022, "dur": 4.198, + "args": { + "External id": 448160,"Record function id": 0, "Ev Idx": 1695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007934606.267, "dur": 2.532, + "args": { + "External id": 448161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007934606.880, "dur": 1.536, + "args": { + "External id": 448162,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007934607.481, "dur": 0.873, + "args": { + "External id": 448163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007934613.268, "dur": 57979.327, + "args": { + "External id": 448164,"Record function id": 0, "Sequence number": 5285427, "Fwd thread id": 1, "Ev Idx": 1699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007934614.933, "dur": 57969.011, + "args": { + "External id": 448165,"Sequence number": 5285427, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1700 + } + }, + { + "ph": "f", "id": 173, "pid": 4183441, "tid": 31362, "ts": 676007934614.933, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.19)", "pid": 4183441, "tid": 31362, + "ts": 676007934647.550, "dur": 79.837, + "args": { + "External id": 448166,"Record function id": 0, "Ev Idx": 1701 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.19)", "pid": 4183441, "tid": 31362, + "ts": 676007934736.595, "dur": 95.554, + "args": { + "External id": 448167,"Record function id": 0, "Ev Idx": 1702 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.19)", "pid": 4183441, "tid": 31362, + "ts": 676007934838.571, "dur": 57738.019, + "args": { + "External id": 448168,"Record function id": 0, "Ev Idx": 1703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007934898.744, "dur": 8.449, + "args": { + "External id": 448169,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007934917.829, "dur": 8.003, + "args": { + "External id": 448170,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676007934943.477, "dur": 56900.994, + "args": { + "External id": 448171,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676007934963.824, "dur": 56870.633, + "args": { + "External id": 448172,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007934994.279, "dur": 7.545, + "args": { + "External id": 448173,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007935008.103, "dur": 56787.353, + "args": { + "External id": 448174,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 1709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007935010.631, "dur": 56784.074, + "args": { + "External id": 448175,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 1710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007935014.255, "dur": 5.558, + "args": { + "External id": 448176,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007935021.345, "dur": 56769.396, + "args": { + "External id": 448177,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 1712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676007991939.765, "dur": 10.520, + "args": { + "External id": 448178,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 1713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007991943.139, "dur": 6.851, + "args": { + "External id": 448179,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676007991986.396, "dur": 269.316, + "args": { + "External id": 448180,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 1715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007992017.245, "dur": 233.720, + "args": { + "External id": 448181,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1716, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676007992031.568, "dur": 213.972, + "args": { + "External id": 448182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 1717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007992276.843, "dur": 2.142, + "args": { + "External id": 448183,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1718, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992334.200, "dur": 6.311, + "args": { + "External id": 448184,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992394.455, "dur": 1.158, + "args": { + "External id": 448185,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992414.066, "dur": 1.587, + "args": { + "External id": 448186,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992436.386, "dur": 1.112, + "args": { + "External id": 448187,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992451.042, "dur": 0.938, + "args": { + "External id": 448188,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992464.069, "dur": 1.063, + "args": { + "External id": 448189,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992479.513, "dur": 1.520, + "args": { + "External id": 448190,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992496.456, "dur": 2.533, + "args": { + "External id": 448191,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992512.814, "dur": 0.841, + "args": { + "External id": 448192,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007992607.344, "dur": 2755.074, + "args": { + "External id": 448193,"Record function id": 0, "Ev Idx": 1728 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007992626.891, "dur": 1105.593, + "args": { + "External id": 448194,"Record function id": 0, "Ev Idx": 1729 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007992641.172, "dur": 361.682, + "args": { + "External id": 448195,"Record function id": 0, "Ev Idx": 1730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992770.952, "dur": 4.823, + "args": { + "External id": 448196,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992779.054, "dur": 1.176, + "args": { + "External id": 448197,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992782.073, "dur": 0.971, + "args": { + "External id": 448198,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992784.695, "dur": 3.092, + "args": { + "External id": 448199,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992789.198, "dur": 1.014, + "args": { + "External id": 448200,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992793.523, "dur": 1.163, + "args": { + "External id": 448201,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992796.439, "dur": 2.588, + "args": { + "External id": 448202,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992800.636, "dur": 0.855, + "args": { + "External id": 448203,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992803.235, "dur": 0.994, + "args": { + "External id": 448204,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007992807.458, "dur": 0.957, + "args": { + "External id": 448205,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676007992827.479, "dur": 145.176, + "args": { + "External id": 448206,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676007992845.115, "dur": 123.660, + "args": { + "External id": 448207,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007992863.039, "dur": 12.670, + "args": { + "External id": 448208,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007992878.721, "dur": 62.309, + "args": { + "External id": 448209,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 1744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007992881.226, "dur": 59.361, + "args": { + "External id": 448210,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 1745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007992885.181, "dur": 7.462, + "args": { + "External id": 448211,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007992894.306, "dur": 45.756, + "args": { + "External id": 448212,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 1747 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.17", "pid": 4183441, "tid": 31362, + "ts": 676007993116.953, "dur": 606.649, + "args": { + "External id": 448213,"Record function id": 0, "Ev Idx": 1748 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676007993136.030, "dur": 572.941, + "args": { + "External id": 448214,"Record function id": 0, "Ev Idx": 1749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007993201.341, "dur": 5.211, + "args": { + "External id": 448215,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676007993222.223, "dur": 36.806, + "args": { + "External id": 448216,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993226.980, "dur": 3.098, + "args": { + "External id": 448217,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993231.915, "dur": 0.504, + "args": { + "External id": 448218,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993234.009, "dur": 0.569, + "args": { + "External id": 448219,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993238.012, "dur": 0.477, + "args": { + "External id": 448220,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993240.351, "dur": 0.516, + "args": { + "External id": 448221,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993241.906, "dur": 0.883, + "args": { + "External id": 448222,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993245.530, "dur": 1.804, + "args": { + "External id": 448223,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993248.542, "dur": 0.531, + "args": { + "External id": 448224,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993250.567, "dur": 1.742, + "args": { + "External id": 448225,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676007993272.920, "dur": 33.025, + "args": { + "External id": 448226,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676007993339.398, "dur": 106.352, + "args": { + "External id": 448227,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007993349.086, "dur": 4.548, + "args": { + "External id": 448228,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676007993359.328, "dur": 12.427, + "args": { + "External id": 448229,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676007993363.322, "dur": 7.970, + "args": { + "External id": 448230,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993369.382, "dur": 0.488, + "args": { + "External id": 448231,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676007993379.062, "dur": 28.448, + "args": { + "External id": 448232,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993381.492, "dur": 0.386, + "args": { + "External id": 448233,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993383.191, "dur": 1.680, + "args": { + "External id": 448234,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993386.019, "dur": 0.522, + "args": { + "External id": 448235,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993388.069, "dur": 2.008, + "args": { + "External id": 448236,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993393.048, "dur": 0.482, + "args": { + "External id": 448237,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993394.800, "dur": 0.437, + "args": { + "External id": 448238,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993396.369, "dur": 0.676, + "args": { + "External id": 448239,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993399.005, "dur": 0.400, + "args": { + "External id": 448240,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676007993400.800, "dur": 0.508, + "args": { + "External id": 448241,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676007993419.298, "dur": 19.022, + "args": { + "External id": 448242,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676007993489.165, "dur": 115.655, + "args": { + "External id": 448243,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007993516.964, "dur": 84.537, + "args": { + "External id": 448244,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1779, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676007993527.830, "dur": 69.623, + "args": { + "External id": 448245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676007993621.165, "dur": 1.821, + "args": { + "External id": 448246,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1781, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007993740.390, "dur": 1598.159, + "args": { + "External id": 448247,"Sequence number": 5285426, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1782 + } + }, + { + "ph": "f", "id": 174, "pid": 4183441, "tid": 31362, "ts": 676007993740.390, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007993854.106, "dur": 99.376, + "args": { + "External id": 448248,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676007993997.290, "dur": 44.110, + "args": { + "External id": 448249,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676007994058.167, "dur": 61.758, + "args": { + "External id": 448250,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994133.345, "dur": 31.589, + "args": { + "External id": 448251,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994173.162, "dur": 34.729, + "args": { + "External id": 448252,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994214.523, "dur": 23.719, + "args": { + "External id": 448253,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994245.684, "dur": 28.575, + "args": { + "External id": 448254,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676007994299.118, "dur": 25.573, + "args": { + "External id": 448255,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676007994344.358, "dur": 25.640, + "args": { + "External id": 448256,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676007994393.155, "dur": 19.524, + "args": { + "External id": 448257,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676007994428.195, "dur": 13.196, + "args": { + "External id": 448258,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994448.840, "dur": 36.117, + "args": { + "External id": 448259,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994488.239, "dur": 30.404, + "args": { + "External id": 448260,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676007994545.858, "dur": 203.391, + "args": { + "External id": 448261,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007994622.921, "dur": 6.783, + "args": { + "External id": 448262,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007994631.289, "dur": 2.302, + "args": { + "External id": 448263,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676007994788.916, "dur": 24.680, + "args": { + "External id": 448264,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676007994827.701, "dur": 13.434, + "args": { + "External id": 448265,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994849.881, "dur": 48.707, + "args": { + "External id": 448266,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994903.977, "dur": 32.356, + "args": { + "External id": 448267,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994944.920, "dur": 27.978, + "args": { + "External id": 448268,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007994977.305, "dur": 28.527, + "args": { + "External id": 448269,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007995012.436, "dur": 39.420, + "args": { + "External id": 448270,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676007995064.674, "dur": 52.529, + "args": { + "External id": 448271,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676007995142.630, "dur": 22.660, + "args": { + "External id": 448272,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676007995182.888, "dur": 25.269, + "args": { + "External id": 448273,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676007995224.243, "dur": 16.529, + "args": { + "External id": 448274,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676007995263.023, "dur": 13.513, + "args": { + "External id": 448275,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676007995291.674, "dur": 15.218, + "args": { + "External id": 448276,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995383.837, "dur": 14.712, + "args": { + "External id": 448277,"Record function id": 0, "Ev Idx": 1812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995387.655, "dur": 10.009, + "args": { + "External id": 448278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995391.539, "dur": 5.283, + "args": { + "External id": 448279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995392.864, "dur": 3.841, + "args": { + "External id": 448280,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995402.695, "dur": 8.770, + "args": { + "External id": 448281,"Record function id": 0, "Ev Idx": 1816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995408.196, "dur": 2.823, + "args": { + "External id": 448282,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995408.995, "dur": 1.560, + "args": { + "External id": 448283,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995409.708, "dur": 0.728, + "args": { + "External id": 448284,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995414.925, "dur": 7.355, + "args": { + "External id": 448285,"Record function id": 0, "Ev Idx": 1820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995416.990, "dur": 4.885, + "args": { + "External id": 448286,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995417.571, "dur": 3.666, + "args": { + "External id": 448287,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995418.151, "dur": 3.006, + "args": { + "External id": 448288,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995425.807, "dur": 4.942, + "args": { + "External id": 448289,"Record function id": 0, "Ev Idx": 1824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995427.469, "dur": 2.893, + "args": { + "External id": 448290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995428.448, "dur": 1.302, + "args": { + "External id": 448291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995428.788, "dur": 0.896, + "args": { + "External id": 448292,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995434.107, "dur": 4.648, + "args": { + "External id": 448293,"Record function id": 0, "Ev Idx": 1828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995436.044, "dur": 2.327, + "args": { + "External id": 448294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995436.635, "dur": 1.049, + "args": { + "External id": 448295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995436.927, "dur": 0.690, + "args": { + "External id": 448296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995442.406, "dur": 4.403, + "args": { + "External id": 448297,"Record function id": 0, "Ev Idx": 1832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995444.246, "dur": 2.166, + "args": { + "External id": 448298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995444.958, "dur": 1.036, + "args": { + "External id": 448299,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995445.355, "dur": 0.575, + "args": { + "External id": 448300,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995450.292, "dur": 4.499, + "args": { + "External id": 448301,"Record function id": 0, "Ev Idx": 1836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995452.011, "dur": 2.358, + "args": { + "External id": 448302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995452.706, "dur": 1.230, + "args": { + "External id": 448303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995452.979, "dur": 0.861, + "args": { + "External id": 448304,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995458.039, "dur": 9.078, + "args": { + "External id": 448305,"Record function id": 0, "Ev Idx": 1840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995459.492, "dur": 7.241, + "args": { + "External id": 448306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995460.110, "dur": 6.100, + "args": { + "External id": 448307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995462.305, "dur": 3.842, + "args": { + "External id": 448308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995470.243, "dur": 3.809, + "args": { + "External id": 448309,"Record function id": 0, "Ev Idx": 1844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676007995471.626, "dur": 2.043, + "args": { + "External id": 448310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676007995472.104, "dur": 1.128, + "args": { + "External id": 448311,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676007995472.547, "dur": 0.621, + "args": { + "External id": 448312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007995477.733, "dur": 15154.784, + "args": { + "External id": 448313,"Record function id": 0, "Sequence number": 5285425, "Fwd thread id": 1, "Ev Idx": 1848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676007995478.876, "dur": 15145.205, + "args": { + "External id": 448314,"Sequence number": 5285425, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1849 + } + }, + { + "ph": "f", "id": 175, "pid": 4183441, "tid": 31362, "ts": 676007995478.876, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007995506.863, "dur": 37.038, + "args": { + "External id": 448315,"Record function id": 0, "Ev Idx": 1850 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007995551.412, "dur": 72.657, + "args": { + "External id": 448316,"Record function id": 0, "Ev Idx": 1851 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.18)", "pid": 4183441, "tid": 31362, + "ts": 676007995631.718, "dur": 14985.848, + "args": { + "External id": 448317,"Record function id": 0, "Ev Idx": 1852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007995786.684, "dur": 7.003, + "args": { + "External id": 448318,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676007995804.698, "dur": 6.767, + "args": { + "External id": 448319,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676007995827.672, "dur": 14064.666, + "args": { + "External id": 448320,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676007995841.851, "dur": 14042.720, + "args": { + "External id": 448321,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 1856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676007995866.762, "dur": 13.637, + "args": { + "External id": 448322,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676007995884.814, "dur": 13966.183, + "args": { + "External id": 448323,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 1858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676007995887.073, "dur": 13963.251, + "args": { + "External id": 448324,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 1859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676007995892.399, "dur": 4.677, + "args": { + "External id": 448325,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676007995900.611, "dur": 13946.578, + "args": { + "External id": 448326,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 1861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008009978.005, "dur": 9.345, + "args": { + "External id": 448327,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 1862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008009981.143, "dur": 5.842, + "args": { + "External id": 448328,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008010015.643, "dur": 307.408, + "args": { + "External id": 448329,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 1864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008010045.750, "dur": 272.087, + "args": { + "External id": 448330,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1865, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008010058.574, "dur": 254.064, + "args": { + "External id": 448331,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 1866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008010344.905, "dur": 2.032, + "args": { + "External id": 448332,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1867, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010402.744, "dur": 6.153, + "args": { + "External id": 448333,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010455.312, "dur": 1.737, + "args": { + "External id": 448334,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010473.150, "dur": 2.847, + "args": { + "External id": 448335,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010488.618, "dur": 0.989, + "args": { + "External id": 448336,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010503.707, "dur": 1.011, + "args": { + "External id": 448337,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010516.428, "dur": 0.905, + "args": { + "External id": 448338,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010529.439, "dur": 3.730, + "args": { + "External id": 448339,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010545.747, "dur": 2.775, + "args": { + "External id": 448340,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010558.719, "dur": 0.941, + "args": { + "External id": 448341,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008010646.387, "dur": 2714.270, + "args": { + "External id": 448342,"Record function id": 0, "Ev Idx": 1877 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676008010703.068, "dur": 1031.270, + "args": { + "External id": 448343,"Record function id": 0, "Ev Idx": 1878 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676008010720.539, "dur": 309.790, + "args": { + "External id": 448344,"Record function id": 0, "Ev Idx": 1879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010804.871, "dur": 4.820, + "args": { + "External id": 448345,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 1880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010813.317, "dur": 1.095, + "args": { + "External id": 448346,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010816.367, "dur": 3.142, + "args": { + "External id": 448347,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010821.957, "dur": 1.275, + "args": { + "External id": 448348,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010824.693, "dur": 0.894, + "args": { + "External id": 448349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010826.840, "dur": 1.058, + "args": { + "External id": 448350,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 1885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010829.380, "dur": 2.416, + "args": { + "External id": 448351,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 1886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010834.896, "dur": 1.329, + "args": { + "External id": 448352,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010837.817, "dur": 0.754, + "args": { + "External id": 448353,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008010840.161, "dur": 0.808, + "args": { + "External id": 448354,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 1889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008010857.107, "dur": 144.683, + "args": { + "External id": 448355,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008010872.225, "dur": 125.249, + "args": { + "External id": 448356,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 1891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008010889.920, "dur": 16.244, + "args": { + "External id": 448357,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008010909.198, "dur": 61.605, + "args": { + "External id": 448358,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 1893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008010911.488, "dur": 59.038, + "args": { + "External id": 448359,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 1894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008010915.392, "dur": 6.289, + "args": { + "External id": 448360,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008010923.143, "dur": 46.877, + "args": { + "External id": 448361,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 1896 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.16", "pid": 4183441, "tid": 31362, + "ts": 676008011140.671, "dur": 585.842, + "args": { + "External id": 448362,"Record function id": 0, "Ev Idx": 1897 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008011159.180, "dur": 554.615, + "args": { + "External id": 448363,"Record function id": 0, "Ev Idx": 1898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008011220.673, "dur": 5.210, + "args": { + "External id": 448364,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008011240.619, "dur": 34.913, + "args": { + "External id": 448365,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011245.124, "dur": 3.126, + "args": { + "External id": 448366,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011250.174, "dur": 0.483, + "args": { + "External id": 448367,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011252.196, "dur": 0.498, + "args": { + "External id": 448368,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011255.785, "dur": 0.373, + "args": { + "External id": 448369,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011257.467, "dur": 0.844, + "args": { + "External id": 448370,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011259.649, "dur": 2.084, + "args": { + "External id": 448371,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011264.055, "dur": 0.433, + "args": { + "External id": 448372,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011265.758, "dur": 0.470, + "args": { + "External id": 448373,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011267.591, "dur": 1.858, + "args": { + "External id": 448374,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008011285.700, "dur": 34.328, + "args": { + "External id": 448375,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008011350.192, "dur": 105.532, + "args": { + "External id": 448376,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 1911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008011362.773, "dur": 3.375, + "args": { + "External id": 448377,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008011370.927, "dur": 10.377, + "args": { + "External id": 448378,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008011374.856, "dur": 6.049, + "args": { + "External id": 448379,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 1914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011379.116, "dur": 0.603, + "args": { + "External id": 448380,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 1915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008011388.191, "dur": 31.741, + "args": { + "External id": 448381,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 1916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011390.283, "dur": 0.519, + "args": { + "External id": 448382,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011392.276, "dur": 0.573, + "args": { + "External id": 448383,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011398.425, "dur": 2.876, + "args": { + "External id": 448384,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011402.667, "dur": 0.476, + "args": { + "External id": 448385,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011404.344, "dur": 0.419, + "args": { + "External id": 448386,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011407.004, "dur": 0.341, + "args": { + "External id": 448387,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011408.823, "dur": 0.337, + "args": { + "External id": 448388,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011410.568, "dur": 0.401, + "args": { + "External id": 448389,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008011413.292, "dur": 0.357, + "args": { + "External id": 448390,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 1925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008011429.092, "dur": 18.994, + "args": { + "External id": 448391,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 1926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008011496.305, "dur": 113.575, + "args": { + "External id": 448392,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 1927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008011525.169, "dur": 81.492, + "args": { + "External id": 448393,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1928, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008011534.135, "dur": 68.548, + "args": { + "External id": 448394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 1929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008011625.736, "dur": 1.888, + "args": { + "External id": 448395,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1930, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008011742.571, "dur": 1596.823, + "args": { + "External id": 448396,"Sequence number": 5285424, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1931 + } + }, + { + "ph": "f", "id": 176, "pid": 4183441, "tid": 31362, "ts": 676008011742.571, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008011857.388, "dur": 99.464, + "args": { + "External id": 448397,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 1932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008011998.884, "dur": 36.602, + "args": { + "External id": 448398,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 1933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008012052.133, "dur": 55.809, + "args": { + "External id": 448399,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 1934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012122.083, "dur": 30.636, + "args": { + "External id": 448400,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012158.867, "dur": 33.590, + "args": { + "External id": 448401,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012198.883, "dur": 20.724, + "args": { + "External id": 448402,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 1937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012231.616, "dur": 29.942, + "args": { + "External id": 448403,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 1938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008012290.951, "dur": 22.931, + "args": { + "External id": 448404,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 1939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008012331.134, "dur": 25.731, + "args": { + "External id": 448405,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008012378.553, "dur": 18.975, + "args": { + "External id": 448406,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008012410.129, "dur": 13.283, + "args": { + "External id": 448407,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012431.837, "dur": 36.776, + "args": { + "External id": 448408,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012471.421, "dur": 29.655, + "args": { + "External id": 448409,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008012528.374, "dur": 209.662, + "args": { + "External id": 448410,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008012604.095, "dur": 6.772, + "args": { + "External id": 448411,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008012612.707, "dur": 2.421, + "args": { + "External id": 448412,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008012774.875, "dur": 25.856, + "args": { + "External id": 448413,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008012814.072, "dur": 15.939, + "args": { + "External id": 448414,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012838.734, "dur": 53.646, + "args": { + "External id": 448415,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012898.076, "dur": 32.255, + "args": { + "External id": 448416,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012942.112, "dur": 29.971, + "args": { + "External id": 448417,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008012976.522, "dur": 32.020, + "args": { + "External id": 448418,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008013013.484, "dur": 27.723, + "args": { + "External id": 448419,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 1954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008013048.907, "dur": 28.815, + "args": { + "External id": 448420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 1955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008013116.225, "dur": 39.242, + "args": { + "External id": 448421,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 1956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008013180.371, "dur": 28.087, + "args": { + "External id": 448422,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008013225.346, "dur": 18.392, + "args": { + "External id": 448423,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 1958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008013258.963, "dur": 18.390, + "args": { + "External id": 448424,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 1959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008013292.627, "dur": 16.321, + "args": { + "External id": 448425,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 1960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013382.085, "dur": 15.075, + "args": { + "External id": 448426,"Record function id": 0, "Ev Idx": 1961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013385.999, "dur": 10.273, + "args": { + "External id": 448427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013389.957, "dur": 5.459, + "args": { + "External id": 448428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013391.519, "dur": 3.798, + "args": { + "External id": 448429,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013401.184, "dur": 7.071, + "args": { + "External id": 448430,"Record function id": 0, "Ev Idx": 1965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013403.225, "dur": 4.537, + "args": { + "External id": 448431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013403.879, "dur": 3.362, + "args": { + "External id": 448432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013404.376, "dur": 2.782, + "args": { + "External id": 448433,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013411.714, "dur": 4.552, + "args": { + "External id": 448434,"Record function id": 0, "Ev Idx": 1969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013413.251, "dur": 2.615, + "args": { + "External id": 448435,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013413.879, "dur": 1.462, + "args": { + "External id": 448436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013414.341, "dur": 0.912, + "args": { + "External id": 448437,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 1972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013420.082, "dur": 4.229, + "args": { + "External id": 448438,"Record function id": 0, "Ev Idx": 1973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013421.899, "dur": 2.002, + "args": { + "External id": 448439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013422.477, "dur": 0.923, + "args": { + "External id": 448440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013422.755, "dur": 0.550, + "args": { + "External id": 448441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 1976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013427.509, "dur": 3.914, + "args": { + "External id": 448442,"Record function id": 0, "Ev Idx": 1977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013429.087, "dur": 1.939, + "args": { + "External id": 448443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013429.580, "dur": 0.965, + "args": { + "External id": 448444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013429.878, "dur": 0.602, + "args": { + "External id": 448445,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013435.030, "dur": 4.155, + "args": { + "External id": 448446,"Record function id": 0, "Ev Idx": 1981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013436.373, "dur": 2.417, + "args": { + "External id": 448447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013437.038, "dur": 1.300, + "args": { + "External id": 448448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013437.543, "dur": 0.730, + "args": { + "External id": 448449,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013442.456, "dur": 4.000, + "args": { + "External id": 448450,"Record function id": 0, "Ev Idx": 1985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013444.186, "dur": 1.860, + "args": { + "External id": 448451,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013444.779, "dur": 0.853, + "args": { + "External id": 448452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013445.053, "dur": 0.516, + "args": { + "External id": 448453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013449.685, "dur": 5.640, + "args": { + "External id": 448454,"Record function id": 0, "Ev Idx": 1989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013451.031, "dur": 3.907, + "args": { + "External id": 448455,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013451.631, "dur": 2.875, + "args": { + "External id": 448456,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013453.906, "dur": 0.534, + "args": { + "External id": 448457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 1992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013458.526, "dur": 5.683, + "args": { + "External id": 448458,"Record function id": 0, "Ev Idx": 1993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008013460.030, "dur": 3.774, + "args": { + "External id": 448459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008013460.681, "dur": 2.722, + "args": { + "External id": 448460,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008013460.959, "dur": 2.368, + "args": { + "External id": 448461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 1996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008013468.967, "dur": 15157.802, + "args": { + "External id": 448462,"Record function id": 0, "Sequence number": 5285423, "Fwd thread id": 1, "Ev Idx": 1997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008013470.471, "dur": 15148.472, + "args": { + "External id": 448463,"Sequence number": 5285423, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 1998 + } + }, + { + "ph": "f", "id": 177, "pid": 4183441, "tid": 31362, "ts": 676008013470.471, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676008013500.240, "dur": 38.523, + "args": { + "External id": 448464,"Record function id": 0, "Ev Idx": 1999 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676008013546.162, "dur": 64.255, + "args": { + "External id": 448465,"Record function id": 0, "Ev Idx": 2000 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.17)", "pid": 4183441, "tid": 31362, + "ts": 676008013618.246, "dur": 14993.420, + "args": { + "External id": 448466,"Record function id": 0, "Ev Idx": 2001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008013741.256, "dur": 7.023, + "args": { + "External id": 448467,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008013758.729, "dur": 5.114, + "args": { + "External id": 448468,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008013777.137, "dur": 14150.814, + "args": { + "External id": 448469,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008013790.315, "dur": 14129.949, + "args": { + "External id": 448470,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008013813.865, "dur": 13.524, + "args": { + "External id": 448471,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008013831.704, "dur": 14053.760, + "args": { + "External id": 448472,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008013834.348, "dur": 14050.469, + "args": { + "External id": 448473,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008013838.129, "dur": 6.000, + "args": { + "External id": 448474,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008013847.666, "dur": 14034.053, + "args": { + "External id": 448475,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008028013.153, "dur": 9.410, + "args": { + "External id": 448476,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008028016.209, "dur": 5.933, + "args": { + "External id": 448477,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008028050.332, "dur": 268.712, + "args": { + "External id": 448478,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008028080.778, "dur": 233.832, + "args": { + "External id": 448479,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2014, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008028104.528, "dur": 205.015, + "args": { + "External id": 448480,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008028338.649, "dur": 2.138, + "args": { + "External id": 448481,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2016, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028393.605, "dur": 5.936, + "args": { + "External id": 448482,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028448.669, "dur": 2.959, + "args": { + "External id": 448483,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028469.415, "dur": 1.187, + "args": { + "External id": 448484,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028483.782, "dur": 0.785, + "args": { + "External id": 448485,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028496.784, "dur": 0.811, + "args": { + "External id": 448486,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028510.012, "dur": 2.262, + "args": { + "External id": 448487,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028526.123, "dur": 1.096, + "args": { + "External id": 448488,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028538.696, "dur": 2.624, + "args": { + "External id": 448489,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028553.739, "dur": 0.915, + "args": { + "External id": 448490,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008028640.380, "dur": 2692.313, + "args": { + "External id": 448491,"Record function id": 0, "Ev Idx": 2026 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008028692.737, "dur": 1034.988, + "args": { + "External id": 448492,"Record function id": 0, "Ev Idx": 2027 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008028708.368, "dur": 307.244, + "args": { + "External id": 448493,"Record function id": 0, "Ev Idx": 2028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028794.465, "dur": 6.046, + "args": { + "External id": 448494,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028803.789, "dur": 0.995, + "args": { + "External id": 448495,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028806.639, "dur": 1.247, + "args": { + "External id": 448496,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028811.039, "dur": 1.019, + "args": { + "External id": 448497,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028813.527, "dur": 0.832, + "args": { + "External id": 448498,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028815.914, "dur": 0.949, + "args": { + "External id": 448499,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028818.687, "dur": 2.503, + "args": { + "External id": 448500,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028824.190, "dur": 0.920, + "args": { + "External id": 448501,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028826.523, "dur": 2.732, + "args": { + "External id": 448502,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008028830.569, "dur": 0.829, + "args": { + "External id": 448503,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008028847.357, "dur": 139.251, + "args": { + "External id": 448504,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008028861.967, "dur": 120.616, + "args": { + "External id": 448505,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008028877.767, "dur": 13.158, + "args": { + "External id": 448506,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008028895.029, "dur": 61.018, + "args": { + "External id": 448507,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008028897.671, "dur": 58.059, + "args": { + "External id": 448508,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008028902.757, "dur": 5.915, + "args": { + "External id": 448509,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008028910.436, "dur": 44.730, + "args": { + "External id": 448510,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2045 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.15", "pid": 4183441, "tid": 31362, + "ts": 676008029121.733, "dur": 598.631, + "args": { + "External id": 448511,"Record function id": 0, "Ev Idx": 2046 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008029138.822, "dur": 567.725, + "args": { + "External id": 448512,"Record function id": 0, "Ev Idx": 2047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008029216.510, "dur": 5.564, + "args": { + "External id": 448513,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008029238.391, "dur": 31.019, + "args": { + "External id": 448514,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029242.824, "dur": 1.590, + "args": { + "External id": 448515,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029247.325, "dur": 0.485, + "args": { + "External id": 448516,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029249.005, "dur": 0.315, + "args": { + "External id": 448517,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029250.905, "dur": 3.906, + "args": { + "External id": 448518,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029256.264, "dur": 0.335, + "args": { + "External id": 448519,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029257.804, "dur": 0.368, + "args": { + "External id": 448520,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029260.711, "dur": 0.307, + "args": { + "External id": 448521,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029262.451, "dur": 0.342, + "args": { + "External id": 448522,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029263.864, "dur": 0.280, + "args": { + "External id": 448523,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008029280.037, "dur": 32.521, + "args": { + "External id": 448524,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008029342.600, "dur": 96.108, + "args": { + "External id": 448525,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008029352.246, "dur": 3.559, + "args": { + "External id": 448526,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008029360.452, "dur": 10.458, + "args": { + "External id": 448527,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008029364.179, "dur": 6.315, + "args": { + "External id": 448528,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029367.286, "dur": 2.019, + "args": { + "External id": 448529,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008029378.050, "dur": 23.281, + "args": { + "External id": 448530,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029379.552, "dur": 1.986, + "args": { + "External id": 448531,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029382.364, "dur": 0.619, + "args": { + "External id": 448532,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029384.206, "dur": 0.330, + "args": { + "External id": 448533,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029386.129, "dur": 0.468, + "args": { + "External id": 448534,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029387.703, "dur": 0.269, + "args": { + "External id": 448535,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029388.893, "dur": 1.341, + "args": { + "External id": 448536,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029390.893, "dur": 0.300, + "args": { + "External id": 448537,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029392.324, "dur": 0.243, + "args": { + "External id": 448538,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008029395.263, "dur": 2.016, + "args": { + "External id": 448539,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008029412.984, "dur": 18.135, + "args": { + "External id": 448540,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008029481.819, "dur": 112.872, + "args": { + "External id": 448541,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008029508.838, "dur": 82.471, + "args": { + "External id": 448542,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2077, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008029518.293, "dur": 69.095, + "args": { + "External id": 448543,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008029610.141, "dur": 1.924, + "args": { + "External id": 448544,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2079, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008029735.799, "dur": 1570.736, + "args": { + "External id": 448545,"Sequence number": 5285422, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2080 + } + }, + { + "ph": "f", "id": 178, "pid": 4183441, "tid": 31362, "ts": 676008029735.799, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008029848.186, "dur": 100.544, + "args": { + "External id": 448546,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008029988.457, "dur": 38.608, + "args": { + "External id": 448547,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008030045.709, "dur": 57.261, + "args": { + "External id": 448548,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030115.327, "dur": 31.473, + "args": { + "External id": 448549,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030152.716, "dur": 33.282, + "args": { + "External id": 448550,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030192.566, "dur": 22.373, + "args": { + "External id": 448551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030224.063, "dur": 30.322, + "args": { + "External id": 448552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008030278.759, "dur": 22.226, + "args": { + "External id": 448553,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008030318.662, "dur": 26.843, + "args": { + "External id": 448554,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008030365.135, "dur": 19.245, + "args": { + "External id": 448555,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008030397.462, "dur": 14.939, + "args": { + "External id": 448556,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030421.355, "dur": 36.853, + "args": { + "External id": 448557,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030461.157, "dur": 30.798, + "args": { + "External id": 448558,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008030524.454, "dur": 204.020, + "args": { + "External id": 448559,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008030601.916, "dur": 6.245, + "args": { + "External id": 448560,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008030609.908, "dur": 1.899, + "args": { + "External id": 448561,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008030765.140, "dur": 27.012, + "args": { + "External id": 448562,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008030803.665, "dur": 14.561, + "args": { + "External id": 448563,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030826.338, "dur": 50.516, + "args": { + "External id": 448564,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030884.232, "dur": 32.043, + "args": { + "External id": 448565,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030922.443, "dur": 27.738, + "args": { + "External id": 448566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030954.370, "dur": 28.352, + "args": { + "External id": 448567,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008030987.859, "dur": 28.087, + "args": { + "External id": 448568,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008031026.476, "dur": 28.459, + "args": { + "External id": 448569,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008031097.626, "dur": 33.304, + "args": { + "External id": 448570,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008031156.748, "dur": 24.279, + "args": { + "External id": 448571,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008031196.636, "dur": 20.085, + "args": { + "External id": 448572,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008031233.901, "dur": 14.986, + "args": { + "External id": 448573,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008031263.348, "dur": 15.405, + "args": { + "External id": 448574,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031353.771, "dur": 15.925, + "args": { + "External id": 448575,"Record function id": 0, "Ev Idx": 2110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031357.176, "dur": 11.633, + "args": { + "External id": 448576,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031361.097, "dur": 6.721, + "args": { + "External id": 448577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031362.362, "dur": 5.345, + "args": { + "External id": 448578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031373.471, "dur": 4.789, + "args": { + "External id": 448579,"Record function id": 0, "Ev Idx": 2114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031375.143, "dur": 2.640, + "args": { + "External id": 448580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031375.773, "dur": 1.369, + "args": { + "External id": 448581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031376.270, "dur": 0.786, + "args": { + "External id": 448582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031381.522, "dur": 7.111, + "args": { + "External id": 448583,"Record function id": 0, "Ev Idx": 2118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031383.211, "dur": 2.194, + "args": { + "External id": 448584,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031383.688, "dur": 1.317, + "args": { + "External id": 448585,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031384.187, "dur": 0.726, + "args": { + "External id": 448586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031391.992, "dur": 4.047, + "args": { + "External id": 448587,"Record function id": 0, "Ev Idx": 2122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031393.571, "dur": 2.042, + "args": { + "External id": 448588,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031394.053, "dur": 1.126, + "args": { + "External id": 448589,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031394.393, "dur": 0.713, + "args": { + "External id": 448590,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031399.481, "dur": 5.291, + "args": { + "External id": 448591,"Record function id": 0, "Ev Idx": 2126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031400.648, "dur": 3.705, + "args": { + "External id": 448592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031401.269, "dur": 2.649, + "args": { + "External id": 448593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031403.173, "dur": 0.629, + "args": { + "External id": 448594,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031407.995, "dur": 3.520, + "args": { + "External id": 448595,"Record function id": 0, "Ev Idx": 2130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031409.233, "dur": 1.888, + "args": { + "External id": 448596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031409.677, "dur": 1.036, + "args": { + "External id": 448597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031409.955, "dur": 0.645, + "args": { + "External id": 448598,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031414.894, "dur": 3.985, + "args": { + "External id": 448599,"Record function id": 0, "Ev Idx": 2134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031416.388, "dur": 2.087, + "args": { + "External id": 448600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031416.821, "dur": 1.074, + "args": { + "External id": 448601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031417.085, "dur": 0.743, + "args": { + "External id": 448602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031421.886, "dur": 5.413, + "args": { + "External id": 448603,"Record function id": 0, "Ev Idx": 2138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031423.088, "dur": 3.810, + "args": { + "External id": 448604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031423.537, "dur": 2.917, + "args": { + "External id": 448605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031423.967, "dur": 2.401, + "args": { + "External id": 448606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031430.391, "dur": 5.488, + "args": { + "External id": 448607,"Record function id": 0, "Ev Idx": 2142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008031431.712, "dur": 3.760, + "args": { + "External id": 448608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008031432.306, "dur": 2.535, + "args": { + "External id": 448609,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008031433.994, "dur": 0.757, + "args": { + "External id": 448610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008031439.870, "dur": 16906.181, + "args": { + "External id": 448611,"Record function id": 0, "Sequence number": 5285421, "Fwd thread id": 1, "Ev Idx": 2146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008031441.362, "dur": 16896.419, + "args": { + "External id": 448612,"Sequence number": 5285421, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2147 + } + }, + { + "ph": "f", "id": 179, "pid": 4183441, "tid": 31362, "ts": 676008031441.362, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008031470.981, "dur": 37.257, + "args": { + "External id": 448613,"Record function id": 0, "Ev Idx": 2148 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008031516.427, "dur": 65.709, + "args": { + "External id": 448614,"Record function id": 0, "Ev Idx": 2149 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.16)", "pid": 4183441, "tid": 31362, + "ts": 676008031588.131, "dur": 16741.906, + "args": { + "External id": 448615,"Record function id": 0, "Ev Idx": 2150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008031709.904, "dur": 7.449, + "args": { + "External id": 448616,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008031728.645, "dur": 4.831, + "args": { + "External id": 448617,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008031747.399, "dur": 15838.684, + "args": { + "External id": 448618,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008031760.857, "dur": 15817.396, + "args": { + "External id": 448619,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008031790.360, "dur": 13.504, + "args": { + "External id": 448620,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008031808.041, "dur": 15737.373, + "args": { + "External id": 448621,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008031811.564, "dur": 15733.095, + "args": { + "External id": 448622,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008031815.431, "dur": 4.668, + "args": { + "External id": 448623,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008031821.574, "dur": 15719.722, + "args": { + "External id": 448624,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008047700.982, "dur": 9.765, + "args": { + "External id": 448625,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008047704.026, "dur": 6.198, + "args": { + "External id": 448626,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008047738.451, "dur": 293.688, + "args": { + "External id": 448627,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008047763.988, "dur": 263.720, + "args": { + "External id": 448628,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2163, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008047774.895, "dur": 247.010, + "args": { + "External id": 448629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008048047.851, "dur": 2.077, + "args": { + "External id": 448630,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2165, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048123.176, "dur": 6.245, + "args": { + "External id": 448631,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048175.445, "dur": 1.110, + "args": { + "External id": 448632,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048192.784, "dur": 1.282, + "args": { + "External id": 448633,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048206.671, "dur": 0.830, + "args": { + "External id": 448634,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048220.712, "dur": 0.845, + "args": { + "External id": 448635,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048233.591, "dur": 0.733, + "args": { + "External id": 448636,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048244.441, "dur": 0.874, + "args": { + "External id": 448637,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048257.617, "dur": 1.560, + "args": { + "External id": 448638,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048268.417, "dur": 0.660, + "args": { + "External id": 448639,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008048360.890, "dur": 2618.862, + "args": { + "External id": 448640,"Record function id": 0, "Ev Idx": 2175 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008048379.537, "dur": 984.939, + "args": { + "External id": 448641,"Record function id": 0, "Ev Idx": 2176 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008048394.958, "dur": 331.420, + "args": { + "External id": 448642,"Record function id": 0, "Ev Idx": 2177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048475.900, "dur": 3.995, + "args": { + "External id": 448643,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048483.012, "dur": 1.052, + "args": { + "External id": 448644,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048485.663, "dur": 0.876, + "args": { + "External id": 448645,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048488.002, "dur": 0.915, + "args": { + "External id": 448646,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048490.259, "dur": 0.716, + "args": { + "External id": 448647,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048493.539, "dur": 0.733, + "args": { + "External id": 448648,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048495.587, "dur": 1.341, + "args": { + "External id": 448649,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048498.040, "dur": 2.213, + "args": { + "External id": 448650,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048501.887, "dur": 0.765, + "args": { + "External id": 448651,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008048505.075, "dur": 0.742, + "args": { + "External id": 448652,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008048522.194, "dur": 172.601, + "args": { + "External id": 448653,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008048536.920, "dur": 152.689, + "args": { + "External id": 448654,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008048551.565, "dur": 12.727, + "args": { + "External id": 448655,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008048566.811, "dur": 59.713, + "args": { + "External id": 448656,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008048570.613, "dur": 55.583, + "args": { + "External id": 448657,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048574.197, "dur": 5.158, + "args": { + "External id": 448658,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008048580.927, "dur": 44.726, + "args": { + "External id": 448659,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2194 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.14", "pid": 4183441, "tid": 31362, + "ts": 676008048821.353, "dur": 535.917, + "args": { + "External id": 448660,"Record function id": 0, "Ev Idx": 2195 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008048839.781, "dur": 505.796, + "args": { + "External id": 448661,"Record function id": 0, "Ev Idx": 2196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008048900.551, "dur": 5.357, + "args": { + "External id": 448662,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008048920.930, "dur": 25.098, + "args": { + "External id": 448663,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048924.536, "dur": 1.340, + "args": { + "External id": 448664,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048928.585, "dur": 0.362, + "args": { + "External id": 448665,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048929.998, "dur": 2.297, + "args": { + "External id": 448666,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048933.145, "dur": 0.277, + "args": { + "External id": 448667,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048935.328, "dur": 0.440, + "args": { + "External id": 448668,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048936.499, "dur": 0.245, + "args": { + "External id": 448669,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048937.676, "dur": 1.191, + "args": { + "External id": 448670,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048939.528, "dur": 0.438, + "args": { + "External id": 448671,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008048941.121, "dur": 0.397, + "args": { + "External id": 448672,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008048955.685, "dur": 31.547, + "args": { + "External id": 448673,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008049018.584, "dur": 111.031, + "args": { + "External id": 448674,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008049028.037, "dur": 3.381, + "args": { + "External id": 448675,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008049036.306, "dur": 10.054, + "args": { + "External id": 448676,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008049040.160, "dur": 5.818, + "args": { + "External id": 448677,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049043.039, "dur": 1.761, + "args": { + "External id": 448678,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008049052.598, "dur": 21.441, + "args": { + "External id": 448679,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049053.873, "dur": 1.738, + "args": { + "External id": 448680,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049056.345, "dur": 0.356, + "args": { + "External id": 448681,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049057.404, "dur": 0.350, + "args": { + "External id": 448682,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049059.694, "dur": 0.302, + "args": { + "External id": 448683,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049060.789, "dur": 0.319, + "args": { + "External id": 448684,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049061.799, "dur": 0.262, + "args": { + "External id": 448685,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049063.842, "dur": 0.254, + "args": { + "External id": 448686,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049065.338, "dur": 1.781, + "args": { + "External id": 448687,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008049067.977, "dur": 1.893, + "args": { + "External id": 448688,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008049099.666, "dur": 21.586, + "args": { + "External id": 448689,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008049174.637, "dur": 107.933, + "args": { + "External id": 448690,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008049197.163, "dur": 82.205, + "args": { + "External id": 448691,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2226, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008049205.778, "dur": 69.763, + "args": { + "External id": 448692,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008049296.246, "dur": 1.684, + "args": { + "External id": 448693,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2228, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008049372.758, "dur": 1584.928, + "args": { + "External id": 448694,"Sequence number": 5285420, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2229 + } + }, + { + "ph": "f", "id": 180, "pid": 4183441, "tid": 31362, "ts": 676008049372.758, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008049481.635, "dur": 95.790, + "args": { + "External id": 448695,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008049619.165, "dur": 81.331, + "args": { + "External id": 448696,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008049723.613, "dur": 46.382, + "args": { + "External id": 448697,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008049779.208, "dur": 29.342, + "args": { + "External id": 448698,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008049814.381, "dur": 34.820, + "args": { + "External id": 448699,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008049855.755, "dur": 22.490, + "args": { + "External id": 448700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008049887.660, "dur": 29.494, + "args": { + "External id": 448701,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008049942.006, "dur": 24.376, + "args": { + "External id": 448702,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008049983.112, "dur": 25.603, + "args": { + "External id": 448703,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008050025.600, "dur": 18.651, + "args": { + "External id": 448704,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008050056.361, "dur": 15.489, + "args": { + "External id": 448705,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050081.093, "dur": 58.002, + "args": { + "External id": 448706,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050144.176, "dur": 39.891, + "args": { + "External id": 448707,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008050211.678, "dur": 169.251, + "args": { + "External id": 448708,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008050290.813, "dur": 4.913, + "args": { + "External id": 448709,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008050297.329, "dur": 1.964, + "args": { + "External id": 448710,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008050412.801, "dur": 26.689, + "args": { + "External id": 448711,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008050450.445, "dur": 14.387, + "args": { + "External id": 448712,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050473.653, "dur": 42.543, + "args": { + "External id": 448713,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050521.546, "dur": 31.163, + "args": { + "External id": 448714,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050564.507, "dur": 27.969, + "args": { + "External id": 448715,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050596.811, "dur": 27.814, + "args": { + "External id": 448716,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050631.189, "dur": 62.193, + "args": { + "External id": 448717,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008050705.087, "dur": 31.678, + "args": { + "External id": 448718,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008050754.205, "dur": 22.105, + "args": { + "External id": 448719,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008050793.282, "dur": 34.698, + "args": { + "External id": 448720,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008050848.710, "dur": 20.109, + "args": { + "External id": 448721,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008050884.285, "dur": 14.331, + "args": { + "External id": 448722,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008050908.792, "dur": 16.279, + "args": { + "External id": 448723,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051005.384, "dur": 13.924, + "args": { + "External id": 448724,"Record function id": 0, "Ev Idx": 2259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051008.776, "dur": 9.772, + "args": { + "External id": 448725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051012.654, "dur": 5.074, + "args": { + "External id": 448726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051013.858, "dur": 3.777, + "args": { + "External id": 448727,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051023.056, "dur": 4.652, + "args": { + "External id": 448728,"Record function id": 0, "Ev Idx": 2263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051024.812, "dur": 2.444, + "args": { + "External id": 448729,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051025.648, "dur": 1.081, + "args": { + "External id": 448730,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051026.009, "dur": 0.634, + "args": { + "External id": 448731,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051030.906, "dur": 4.004, + "args": { + "External id": 448732,"Record function id": 0, "Ev Idx": 2267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051032.099, "dur": 2.431, + "args": { + "External id": 448733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051032.552, "dur": 1.584, + "args": { + "External id": 448734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051033.055, "dur": 0.998, + "args": { + "External id": 448735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051038.016, "dur": 3.471, + "args": { + "External id": 448736,"Record function id": 0, "Ev Idx": 2271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051039.024, "dur": 2.068, + "args": { + "External id": 448737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051039.533, "dur": 1.018, + "args": { + "External id": 448738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051039.879, "dur": 0.599, + "args": { + "External id": 448739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051044.552, "dur": 3.235, + "args": { + "External id": 448740,"Record function id": 0, "Ev Idx": 2275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051045.480, "dur": 1.914, + "args": { + "External id": 448741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051045.954, "dur": 1.028, + "args": { + "External id": 448742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051046.323, "dur": 0.588, + "args": { + "External id": 448743,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051051.030, "dur": 7.129, + "args": { + "External id": 448744,"Record function id": 0, "Ev Idx": 2279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051052.222, "dur": 5.557, + "args": { + "External id": 448745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051052.846, "dur": 4.327, + "args": { + "External id": 448746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051056.467, "dur": 0.633, + "args": { + "External id": 448747,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051061.338, "dur": 5.351, + "args": { + "External id": 448748,"Record function id": 0, "Ev Idx": 2283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051062.444, "dur": 3.862, + "args": { + "External id": 448749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051063.070, "dur": 2.853, + "args": { + "External id": 448750,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051063.427, "dur": 2.429, + "args": { + "External id": 448751,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051069.956, "dur": 3.587, + "args": { + "External id": 448752,"Record function id": 0, "Ev Idx": 2287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051070.975, "dur": 2.176, + "args": { + "External id": 448753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051071.419, "dur": 1.347, + "args": { + "External id": 448754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051071.758, "dur": 0.936, + "args": { + "External id": 448755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051076.579, "dur": 3.286, + "args": { + "External id": 448756,"Record function id": 0, "Ev Idx": 2291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008051077.699, "dur": 1.768, + "args": { + "External id": 448757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008051078.142, "dur": 0.941, + "args": { + "External id": 448758,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008051078.442, "dur": 0.569, + "args": { + "External id": 448759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008051099.663, "dur": 14997.509, + "args": { + "External id": 448760,"Record function id": 0, "Sequence number": 5285419, "Fwd thread id": 1, "Ev Idx": 2295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008051101.524, "dur": 14972.476, + "args": { + "External id": 448761,"Sequence number": 5285419, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2296 + } + }, + { + "ph": "f", "id": 181, "pid": 4183441, "tid": 31362, "ts": 676008051101.524, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008051135.381, "dur": 41.789, + "args": { + "External id": 448762,"Record function id": 0, "Ev Idx": 2297 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008051184.968, "dur": 72.164, + "args": { + "External id": 448763,"Record function id": 0, "Ev Idx": 2298 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.15)", "pid": 4183441, "tid": 31362, + "ts": 676008051262.650, "dur": 14804.318, + "args": { + "External id": 448764,"Record function id": 0, "Ev Idx": 2299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008051356.026, "dur": 6.754, + "args": { + "External id": 448765,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008051372.070, "dur": 4.645, + "args": { + "External id": 448766,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008051389.241, "dur": 13977.222, + "args": { + "External id": 448767,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008051402.025, "dur": 13956.103, + "args": { + "External id": 448768,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008051427.235, "dur": 13.565, + "args": { + "External id": 448769,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008051445.244, "dur": 13878.102, + "args": { + "External id": 448770,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008051449.264, "dur": 13873.357, + "args": { + "External id": 448771,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008051452.473, "dur": 4.473, + "args": { + "External id": 448772,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008051458.340, "dur": 13860.737, + "args": { + "External id": 448773,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008065450.411, "dur": 9.152, + "args": { + "External id": 448774,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008065453.274, "dur": 5.862, + "args": { + "External id": 448775,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008065486.298, "dur": 306.169, + "args": { + "External id": 448776,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008065513.498, "dur": 274.185, + "args": { + "External id": 448777,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2312, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008065524.949, "dur": 257.501, + "args": { + "External id": 448778,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008065812.164, "dur": 2.057, + "args": { + "External id": 448779,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2314, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065868.517, "dur": 7.587, + "args": { + "External id": 448780,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065918.649, "dur": 1.083, + "args": { + "External id": 448781,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065935.561, "dur": 1.170, + "args": { + "External id": 448782,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065948.045, "dur": 0.800, + "args": { + "External id": 448783,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065960.702, "dur": 2.243, + "args": { + "External id": 448784,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065972.934, "dur": 0.736, + "args": { + "External id": 448785,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065983.908, "dur": 0.935, + "args": { + "External id": 448786,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008065996.041, "dur": 2.147, + "args": { + "External id": 448787,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066008.358, "dur": 2.519, + "args": { + "External id": 448788,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008066112.375, "dur": 2670.200, + "args": { + "External id": 448789,"Record function id": 0, "Ev Idx": 2324 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008066132.876, "dur": 992.144, + "args": { + "External id": 448790,"Record function id": 0, "Ev Idx": 2325 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008066147.873, "dur": 291.348, + "args": { + "External id": 448791,"Record function id": 0, "Ev Idx": 2326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066229.605, "dur": 4.413, + "args": { + "External id": 448792,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066237.762, "dur": 0.792, + "args": { + "External id": 448793,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066240.348, "dur": 0.908, + "args": { + "External id": 448794,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066243.193, "dur": 0.783, + "args": { + "External id": 448795,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066245.592, "dur": 0.678, + "args": { + "External id": 448796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066247.929, "dur": 0.875, + "args": { + "External id": 448797,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066250.459, "dur": 4.355, + "args": { + "External id": 448798,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066256.427, "dur": 0.751, + "args": { + "External id": 448799,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066258.932, "dur": 1.001, + "args": { + "External id": 448800,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008066261.551, "dur": 0.736, + "args": { + "External id": 448801,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008066279.051, "dur": 133.780, + "args": { + "External id": 448802,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008066293.878, "dur": 115.123, + "args": { + "External id": 448803,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008066307.734, "dur": 12.483, + "args": { + "External id": 448804,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008066322.900, "dur": 58.473, + "args": { + "External id": 448805,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008066325.296, "dur": 55.768, + "args": { + "External id": 448806,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066328.420, "dur": 5.345, + "args": { + "External id": 448807,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008066335.503, "dur": 44.965, + "args": { + "External id": 448808,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2343 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.13", "pid": 4183441, "tid": 31362, + "ts": 676008066526.537, "dur": 590.924, + "args": { + "External id": 448809,"Record function id": 0, "Ev Idx": 2344 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008066542.681, "dur": 559.782, + "args": { + "External id": 448810,"Record function id": 0, "Ev Idx": 2345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008066600.618, "dur": 4.512, + "args": { + "External id": 448811,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008066619.955, "dur": 29.987, + "args": { + "External id": 448812,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066624.384, "dur": 2.355, + "args": { + "External id": 448813,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066628.440, "dur": 2.020, + "args": { + "External id": 448814,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066631.964, "dur": 0.408, + "args": { + "External id": 448815,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066634.969, "dur": 0.335, + "args": { + "External id": 448816,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066636.426, "dur": 0.593, + "args": { + "External id": 448817,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066638.520, "dur": 0.258, + "args": { + "External id": 448818,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066641.102, "dur": 0.356, + "args": { + "External id": 448819,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066642.692, "dur": 0.380, + "args": { + "External id": 448820,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066644.529, "dur": 0.949, + "args": { + "External id": 448821,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008066699.655, "dur": 32.706, + "args": { + "External id": 448822,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008066766.341, "dur": 101.525, + "args": { + "External id": 448823,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008066776.570, "dur": 6.585, + "args": { + "External id": 448824,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008066788.966, "dur": 10.203, + "args": { + "External id": 448825,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008066793.210, "dur": 5.558, + "args": { + "External id": 448826,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066796.741, "dur": 0.547, + "args": { + "External id": 448827,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008066806.278, "dur": 24.773, + "args": { + "External id": 448828,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066808.198, "dur": 0.310, + "args": { + "External id": 448829,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066810.255, "dur": 1.310, + "args": { + "External id": 448830,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066812.868, "dur": 0.298, + "args": { + "External id": 448831,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066814.608, "dur": 0.364, + "args": { + "External id": 448832,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066817.448, "dur": 0.437, + "args": { + "External id": 448833,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066819.295, "dur": 0.273, + "args": { + "External id": 448834,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066821.042, "dur": 1.770, + "args": { + "External id": 448835,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066825.440, "dur": 0.529, + "args": { + "External id": 448836,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008066827.200, "dur": 0.502, + "args": { + "External id": 448837,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008066842.985, "dur": 17.314, + "args": { + "External id": 448838,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008066911.929, "dur": 111.096, + "args": { + "External id": 448839,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008066937.064, "dur": 82.551, + "args": { + "External id": 448840,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2375, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008066946.696, "dur": 68.820, + "args": { + "External id": 448841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008067037.114, "dur": 1.717, + "args": { + "External id": 448842,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2377, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008067132.297, "dur": 1625.360, + "args": { + "External id": 448843,"Sequence number": 5285418, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2378 + } + }, + { + "ph": "f", "id": 182, "pid": 4183441, "tid": 31362, "ts": 676008067132.297, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067242.517, "dur": 106.394, + "args": { + "External id": 448844,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008067389.448, "dur": 38.972, + "args": { + "External id": 448845,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008067446.547, "dur": 40.160, + "args": { + "External id": 448846,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067495.703, "dur": 27.573, + "args": { + "External id": 448847,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067529.536, "dur": 36.975, + "args": { + "External id": 448848,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067575.165, "dur": 26.094, + "args": { + "External id": 448849,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067608.897, "dur": 30.068, + "args": { + "External id": 448850,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008067702.418, "dur": 27.029, + "args": { + "External id": 448851,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008067752.517, "dur": 27.096, + "args": { + "External id": 448852,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008067802.392, "dur": 20.817, + "args": { + "External id": 448853,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008067836.835, "dur": 14.807, + "args": { + "External id": 448854,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067862.015, "dur": 42.671, + "args": { + "External id": 448855,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008067908.368, "dur": 31.322, + "args": { + "External id": 448856,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008067965.476, "dur": 184.578, + "args": { + "External id": 448857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008068039.743, "dur": 5.454, + "args": { + "External id": 448858,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008068047.007, "dur": 4.835, + "args": { + "External id": 448859,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008068184.647, "dur": 25.495, + "args": { + "External id": 448860,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008068222.057, "dur": 16.206, + "args": { + "External id": 448861,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068246.156, "dur": 49.404, + "args": { + "External id": 448862,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068301.248, "dur": 31.343, + "args": { + "External id": 448863,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068339.254, "dur": 28.188, + "args": { + "External id": 448864,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068373.936, "dur": 28.697, + "args": { + "External id": 448865,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068408.520, "dur": 27.357, + "args": { + "External id": 448866,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008068442.653, "dur": 28.381, + "args": { + "External id": 448867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008068488.738, "dur": 22.739, + "args": { + "External id": 448868,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008068543.396, "dur": 30.653, + "args": { + "External id": 448869,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008068590.205, "dur": 17.385, + "args": { + "External id": 448870,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008068623.036, "dur": 17.110, + "args": { + "External id": 448871,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008068706.093, "dur": 20.457, + "args": { + "External id": 448872,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068803.707, "dur": 14.319, + "args": { + "External id": 448873,"Record function id": 0, "Ev Idx": 2408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068807.263, "dur": 9.959, + "args": { + "External id": 448874,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068811.313, "dur": 5.040, + "args": { + "External id": 448875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068812.511, "dur": 3.722, + "args": { + "External id": 448876,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068821.867, "dur": 4.491, + "args": { + "External id": 448877,"Record function id": 0, "Ev Idx": 2412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068823.346, "dur": 2.535, + "args": { + "External id": 448878,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068824.087, "dur": 1.386, + "args": { + "External id": 448879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068824.555, "dur": 0.839, + "args": { + "External id": 448880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068829.571, "dur": 4.456, + "args": { + "External id": 448881,"Record function id": 0, "Ev Idx": 2416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068831.193, "dur": 2.422, + "args": { + "External id": 448882,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068831.720, "dur": 1.366, + "args": { + "External id": 448883,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068832.454, "dur": 0.567, + "args": { + "External id": 448884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068837.136, "dur": 5.591, + "args": { + "External id": 448885,"Record function id": 0, "Ev Idx": 2420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068838.591, "dur": 3.743, + "args": { + "External id": 448886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068839.178, "dur": 2.772, + "args": { + "External id": 448887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068839.481, "dur": 2.411, + "args": { + "External id": 448888,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068846.027, "dur": 4.250, + "args": { + "External id": 448889,"Record function id": 0, "Ev Idx": 2424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068847.090, "dur": 2.791, + "args": { + "External id": 448890,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068847.590, "dur": 1.528, + "args": { + "External id": 448891,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068848.143, "dur": 0.911, + "args": { + "External id": 448892,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068853.615, "dur": 3.750, + "args": { + "External id": 448893,"Record function id": 0, "Ev Idx": 2428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068854.689, "dur": 2.269, + "args": { + "External id": 448894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068855.210, "dur": 1.357, + "args": { + "External id": 448895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068855.818, "dur": 0.684, + "args": { + "External id": 448896,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068860.580, "dur": 4.175, + "args": { + "External id": 448897,"Record function id": 0, "Ev Idx": 2432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068862.024, "dur": 2.341, + "args": { + "External id": 448898,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068862.565, "dur": 1.413, + "args": { + "External id": 448899,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068863.311, "dur": 0.601, + "args": { + "External id": 448900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068867.965, "dur": 3.481, + "args": { + "External id": 448901,"Record function id": 0, "Ev Idx": 2436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068869.070, "dur": 1.980, + "args": { + "External id": 448902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068869.567, "dur": 1.095, + "args": { + "External id": 448903,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068870.043, "dur": 0.555, + "args": { + "External id": 448904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068874.576, "dur": 3.776, + "args": { + "External id": 448905,"Record function id": 0, "Ev Idx": 2440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008068875.721, "dur": 2.236, + "args": { + "External id": 448906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008068876.271, "dur": 1.274, + "args": { + "External id": 448907,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008068876.783, "dur": 0.698, + "args": { + "External id": 448908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008068881.963, "dur": 15006.228, + "args": { + "External id": 448909,"Record function id": 0, "Sequence number": 5285417, "Fwd thread id": 1, "Ev Idx": 2444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008068883.010, "dur": 14996.521, + "args": { + "External id": 448910,"Sequence number": 5285417, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2445 + } + }, + { + "ph": "f", "id": 183, "pid": 4183441, "tid": 31362, "ts": 676008068883.010, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008068911.580, "dur": 36.338, + "args": { + "External id": 448911,"Record function id": 0, "Ev Idx": 2446 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008068955.298, "dur": 65.173, + "args": { + "External id": 448912,"Record function id": 0, "Ev Idx": 2447 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.14)", "pid": 4183441, "tid": 31362, + "ts": 676008069026.048, "dur": 14845.813, + "args": { + "External id": 448913,"Record function id": 0, "Ev Idx": 2448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008069130.215, "dur": 11.327, + "args": { + "External id": 448914,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008069151.459, "dur": 4.829, + "args": { + "External id": 448915,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008069171.079, "dur": 14029.897, + "args": { + "External id": 448916,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008069184.570, "dur": 14008.454, + "args": { + "External id": 448917,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008069207.438, "dur": 14.986, + "args": { + "External id": 448918,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008069226.770, "dur": 13930.711, + "args": { + "External id": 448919,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008069229.292, "dur": 13927.546, + "args": { + "External id": 448920,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008069233.881, "dur": 4.695, + "args": { + "External id": 448921,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008069240.237, "dur": 13912.946, + "args": { + "External id": 448922,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008083284.047, "dur": 8.954, + "args": { + "External id": 448923,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008083286.746, "dur": 5.877, + "args": { + "External id": 448924,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008083321.422, "dur": 251.697, + "args": { + "External id": 448925,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008083348.642, "dur": 220.515, + "args": { + "External id": 448926,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2461, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008083360.712, "dur": 203.981, + "args": { + "External id": 448927,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008083590.516, "dur": 1.989, + "args": { + "External id": 448928,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2463, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083639.369, "dur": 5.644, + "args": { + "External id": 448929,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083720.697, "dur": 2.167, + "args": { + "External id": 448930,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083738.537, "dur": 1.381, + "args": { + "External id": 448931,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083753.211, "dur": 1.156, + "args": { + "External id": 448932,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083764.481, "dur": 1.167, + "args": { + "External id": 448933,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083775.844, "dur": 0.817, + "args": { + "External id": 448934,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083788.071, "dur": 0.728, + "args": { + "External id": 448935,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083801.482, "dur": 1.887, + "args": { + "External id": 448936,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008083813.370, "dur": 0.815, + "args": { + "External id": 448937,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008083903.039, "dur": 2551.123, + "args": { + "External id": 448938,"Record function id": 0, "Ev Idx": 2473 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008083920.704, "dur": 974.250, + "args": { + "External id": 448939,"Record function id": 0, "Ev Idx": 2474 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008083933.608, "dur": 313.604, + "args": { + "External id": 448940,"Record function id": 0, "Ev Idx": 2475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084013.326, "dur": 3.827, + "args": { + "External id": 448941,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084020.486, "dur": 1.005, + "args": { + "External id": 448942,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084023.470, "dur": 0.835, + "args": { + "External id": 448943,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084026.284, "dur": 2.561, + "args": { + "External id": 448944,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084030.707, "dur": 0.936, + "args": { + "External id": 448945,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084033.301, "dur": 0.719, + "args": { + "External id": 448946,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084035.683, "dur": 1.606, + "args": { + "External id": 448947,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084038.894, "dur": 0.942, + "args": { + "External id": 448948,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084042.032, "dur": 0.747, + "args": { + "External id": 448949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008084044.447, "dur": 0.882, + "args": { + "External id": 448950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008084062.328, "dur": 157.334, + "args": { + "External id": 448951,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008084097.157, "dur": 117.816, + "args": { + "External id": 448952,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008084111.405, "dur": 11.373, + "args": { + "External id": 448953,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008084125.435, "dur": 62.384, + "args": { + "External id": 448954,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008084127.984, "dur": 59.530, + "args": { + "External id": 448955,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084131.849, "dur": 7.723, + "args": { + "External id": 448956,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008084141.124, "dur": 45.830, + "args": { + "External id": 448957,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2492 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.12", "pid": 4183441, "tid": 31362, + "ts": 676008084331.403, "dur": 556.361, + "args": { + "External id": 448958,"Record function id": 0, "Ev Idx": 2493 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008084348.818, "dur": 527.016, + "args": { + "External id": 448959,"Record function id": 0, "Ev Idx": 2494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008084407.768, "dur": 4.602, + "args": { + "External id": 448960,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008084427.432, "dur": 29.737, + "args": { + "External id": 448961,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084431.945, "dur": 1.271, + "args": { + "External id": 448962,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084435.617, "dur": 0.490, + "args": { + "External id": 448963,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084437.477, "dur": 0.314, + "args": { + "External id": 448964,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084439.759, "dur": 0.531, + "args": { + "External id": 448965,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084441.617, "dur": 0.480, + "args": { + "External id": 448966,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084443.497, "dur": 0.706, + "args": { + "External id": 448967,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084445.676, "dur": 2.129, + "args": { + "External id": 448968,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084449.450, "dur": 0.421, + "args": { + "External id": 448969,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084452.342, "dur": 0.375, + "args": { + "External id": 448970,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008084467.687, "dur": 29.584, + "args": { + "External id": 448971,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008084527.579, "dur": 98.292, + "args": { + "External id": 448972,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008084537.119, "dur": 3.476, + "args": { + "External id": 448973,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008084545.641, "dur": 9.440, + "args": { + "External id": 448974,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008084549.466, "dur": 5.217, + "args": { + "External id": 448975,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084552.883, "dur": 0.702, + "args": { + "External id": 448976,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008084561.925, "dur": 27.243, + "args": { + "External id": 448977,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084564.079, "dur": 0.450, + "args": { + "External id": 448978,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084566.051, "dur": 0.350, + "args": { + "External id": 448979,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084568.279, "dur": 0.326, + "args": { + "External id": 448980,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084569.826, "dur": 2.184, + "args": { + "External id": 448981,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084577.193, "dur": 0.420, + "args": { + "External id": 448982,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084579.668, "dur": 0.387, + "args": { + "External id": 448983,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084581.288, "dur": 0.374, + "args": { + "External id": 448984,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084582.940, "dur": 0.745, + "args": { + "External id": 448985,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008084585.220, "dur": 0.338, + "args": { + "External id": 448986,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008084600.079, "dur": 19.017, + "args": { + "External id": 448987,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008084702.340, "dur": 110.162, + "args": { + "External id": 448988,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008084726.768, "dur": 82.518, + "args": { + "External id": 448989,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2524, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008084736.584, "dur": 68.778, + "args": { + "External id": 448990,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008084826.843, "dur": 1.670, + "args": { + "External id": 448991,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2526, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008084901.734, "dur": 1531.115, + "args": { + "External id": 448992,"Sequence number": 5285416, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2527 + } + }, + { + "ph": "f", "id": 184, "pid": 4183441, "tid": 31362, "ts": 676008084901.734, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085010.536, "dur": 116.154, + "args": { + "External id": 448993,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008085170.779, "dur": 39.174, + "args": { + "External id": 448994,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008085226.258, "dur": 44.121, + "args": { + "External id": 448995,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085279.538, "dur": 28.403, + "args": { + "External id": 448996,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085315.327, "dur": 32.839, + "args": { + "External id": 448997,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085355.013, "dur": 22.090, + "args": { + "External id": 448998,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085383.623, "dur": 28.624, + "args": { + "External id": 448999,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008085434.468, "dur": 19.970, + "args": { + "External id": 449000,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008085473.252, "dur": 24.968, + "args": { + "External id": 449001,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008085517.554, "dur": 17.264, + "args": { + "External id": 449002,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008085547.805, "dur": 12.531, + "args": { + "External id": 449003,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085568.331, "dur": 35.006, + "args": { + "External id": 449004,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085606.529, "dur": 30.044, + "args": { + "External id": 449005,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008085710.070, "dur": 164.240, + "args": { + "External id": 449006,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008085784.986, "dur": 6.243, + "args": { + "External id": 449007,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008085793.730, "dur": 3.136, + "args": { + "External id": 449008,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008085914.615, "dur": 23.563, + "args": { + "External id": 449009,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008085950.573, "dur": 12.996, + "args": { + "External id": 449010,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008085972.137, "dur": 47.855, + "args": { + "External id": 449011,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008086025.433, "dur": 30.880, + "args": { + "External id": 449012,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008086065.497, "dur": 41.097, + "args": { + "External id": 449013,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008086113.507, "dur": 31.291, + "args": { + "External id": 449014,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008086151.060, "dur": 27.937, + "args": { + "External id": 449015,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008086185.785, "dur": 28.513, + "args": { + "External id": 449016,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008086233.262, "dur": 21.768, + "args": { + "External id": 449017,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008086271.232, "dur": 23.496, + "args": { + "External id": 449018,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008086308.182, "dur": 31.562, + "args": { + "External id": 449019,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008086364.487, "dur": 13.398, + "args": { + "External id": 449020,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008086388.759, "dur": 14.960, + "args": { + "External id": 449021,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086479.142, "dur": 34.588, + "args": { + "External id": 449022,"Record function id": 0, "Ev Idx": 2557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086482.171, "dur": 30.826, + "args": { + "External id": 449023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086485.955, "dur": 26.160, + "args": { + "External id": 449024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086508.185, "dur": 3.835, + "args": { + "External id": 449025,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086518.350, "dur": 4.236, + "args": { + "External id": 449026,"Record function id": 0, "Ev Idx": 2561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086519.809, "dur": 2.306, + "args": { + "External id": 449027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086520.469, "dur": 1.107, + "args": { + "External id": 449028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086520.788, "dur": 0.707, + "args": { + "External id": 449029,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086526.405, "dur": 5.379, + "args": { + "External id": 449030,"Record function id": 0, "Ev Idx": 2565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086527.547, "dur": 3.801, + "args": { + "External id": 449031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086528.017, "dur": 2.927, + "args": { + "External id": 449032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086528.809, "dur": 2.069, + "args": { + "External id": 449033,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086538.504, "dur": 3.598, + "args": { + "External id": 449034,"Record function id": 0, "Ev Idx": 2569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086539.584, "dur": 2.119, + "args": { + "External id": 449035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086540.056, "dur": 1.234, + "args": { + "External id": 449036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086540.458, "dur": 0.768, + "args": { + "External id": 449037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086545.762, "dur": 3.273, + "args": { + "External id": 449038,"Record function id": 0, "Ev Idx": 2573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086546.739, "dur": 1.905, + "args": { + "External id": 449039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086547.168, "dur": 1.082, + "args": { + "External id": 449040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086547.643, "dur": 0.541, + "args": { + "External id": 449041,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086552.932, "dur": 3.453, + "args": { + "External id": 449042,"Record function id": 0, "Ev Idx": 2577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086554.041, "dur": 1.936, + "args": { + "External id": 449043,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086554.533, "dur": 1.028, + "args": { + "External id": 449044,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086554.875, "dur": 0.613, + "args": { + "External id": 449045,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086560.175, "dur": 3.659, + "args": { + "External id": 449046,"Record function id": 0, "Ev Idx": 2581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086561.164, "dur": 2.244, + "args": { + "External id": 449047,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086561.617, "dur": 1.280, + "args": { + "External id": 449048,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086562.188, "dur": 0.645, + "args": { + "External id": 449049,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086567.229, "dur": 3.131, + "args": { + "External id": 449050,"Record function id": 0, "Ev Idx": 2585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086568.101, "dur": 1.863, + "args": { + "External id": 449051,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086568.556, "dur": 0.985, + "args": { + "External id": 449052,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086568.894, "dur": 0.582, + "args": { + "External id": 449053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086574.065, "dur": 3.467, + "args": { + "External id": 449054,"Record function id": 0, "Ev Idx": 2589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008086575.133, "dur": 1.988, + "args": { + "External id": 449055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008086575.567, "dur": 1.022, + "args": { + "External id": 449056,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008086575.978, "dur": 0.547, + "args": { + "External id": 449057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008086582.028, "dur": 15029.167, + "args": { + "External id": 449058,"Record function id": 0, "Sequence number": 5285415, "Fwd thread id": 1, "Ev Idx": 2593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008086583.181, "dur": 15019.072, + "args": { + "External id": 449059,"Sequence number": 5285415, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2594 + } + }, + { + "ph": "f", "id": 185, "pid": 4183441, "tid": 31362, "ts": 676008086583.181, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008086612.134, "dur": 37.274, + "args": { + "External id": 449060,"Record function id": 0, "Ev Idx": 2595 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008086696.649, "dur": 67.551, + "args": { + "External id": 449061,"Record function id": 0, "Ev Idx": 2596 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.13)", "pid": 4183441, "tid": 31362, + "ts": 676008086770.100, "dur": 14824.427, + "args": { + "External id": 449062,"Record function id": 0, "Ev Idx": 2597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008086857.553, "dur": 7.549, + "args": { + "External id": 449063,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008086875.318, "dur": 6.176, + "args": { + "External id": 449064,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008086896.666, "dur": 13982.870, + "args": { + "External id": 449065,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008086909.467, "dur": 13961.275, + "args": { + "External id": 449066,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008086932.813, "dur": 17.012, + "args": { + "External id": 449067,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008086954.408, "dur": 13882.071, + "args": { + "External id": 449068,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008086956.826, "dur": 13878.613, + "args": { + "External id": 449069,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008086960.274, "dur": 6.050, + "args": { + "External id": 449070,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008086967.831, "dur": 13863.889, + "args": { + "External id": 449071,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008100967.747, "dur": 9.533, + "args": { + "External id": 449072,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008100970.767, "dur": 6.149, + "args": { + "External id": 449073,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008101003.786, "dur": 314.131, + "args": { + "External id": 449074,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008101031.360, "dur": 281.671, + "args": { + "External id": 449075,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2610, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008101042.396, "dur": 265.271, + "args": { + "External id": 449076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008101337.715, "dur": 2.438, + "args": { + "External id": 449077,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2612, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101394.686, "dur": 6.703, + "args": { + "External id": 449078,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101443.515, "dur": 1.348, + "args": { + "External id": 449079,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101460.806, "dur": 3.111, + "args": { + "External id": 449080,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101475.103, "dur": 0.796, + "args": { + "External id": 449081,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101486.849, "dur": 0.848, + "args": { + "External id": 449082,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101497.272, "dur": 0.761, + "args": { + "External id": 449083,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101508.770, "dur": 2.488, + "args": { + "External id": 449084,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101522.575, "dur": 1.818, + "args": { + "External id": 449085,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101534.428, "dur": 0.969, + "args": { + "External id": 449086,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008101624.723, "dur": 2661.854, + "args": { + "External id": 449087,"Record function id": 0, "Ev Idx": 2622 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008101644.137, "dur": 999.842, + "args": { + "External id": 449088,"Record function id": 0, "Ev Idx": 2623 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008101697.579, "dur": 314.345, + "args": { + "External id": 449089,"Record function id": 0, "Ev Idx": 2624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101789.242, "dur": 4.661, + "args": { + "External id": 449090,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101797.466, "dur": 0.851, + "args": { + "External id": 449091,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101800.030, "dur": 3.272, + "args": { + "External id": 449092,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101805.143, "dur": 1.032, + "args": { + "External id": 449093,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101808.108, "dur": 1.079, + "args": { + "External id": 449094,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101810.846, "dur": 1.213, + "args": { + "External id": 449095,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101813.983, "dur": 1.669, + "args": { + "External id": 449096,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101817.185, "dur": 0.979, + "args": { + "External id": 449097,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101820.205, "dur": 0.700, + "args": { + "External id": 449098,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008101822.687, "dur": 0.559, + "args": { + "External id": 449099,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008101841.780, "dur": 141.620, + "args": { + "External id": 449100,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008101857.196, "dur": 121.864, + "args": { + "External id": 449101,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008101874.639, "dur": 13.536, + "args": { + "External id": 449102,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008101890.821, "dur": 61.824, + "args": { + "External id": 449103,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008101893.378, "dur": 58.966, + "args": { + "External id": 449104,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008101897.634, "dur": 5.500, + "args": { + "External id": 449105,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008101904.805, "dur": 46.872, + "args": { + "External id": 449106,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2641 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.11", "pid": 4183441, "tid": 31362, + "ts": 676008102117.023, "dur": 519.389, + "args": { + "External id": 449107,"Record function id": 0, "Ev Idx": 2642 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008102133.376, "dur": 491.711, + "args": { + "External id": 449108,"Record function id": 0, "Ev Idx": 2643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008102196.747, "dur": 5.990, + "args": { + "External id": 449109,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008102217.334, "dur": 27.951, + "args": { + "External id": 449110,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102221.461, "dur": 1.422, + "args": { + "External id": 449111,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102224.402, "dur": 0.461, + "args": { + "External id": 449112,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102227.314, "dur": 0.335, + "args": { + "External id": 449113,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102228.752, "dur": 0.396, + "args": { + "External id": 449114,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102230.727, "dur": 1.241, + "args": { + "External id": 449115,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102233.104, "dur": 1.911, + "args": { + "External id": 449116,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102236.777, "dur": 0.471, + "args": { + "External id": 449117,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102239.711, "dur": 0.253, + "args": { + "External id": 449118,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102241.121, "dur": 0.377, + "args": { + "External id": 449119,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008102255.900, "dur": 31.759, + "args": { + "External id": 449120,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008102319.257, "dur": 92.800, + "args": { + "External id": 449121,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008102328.488, "dur": 3.547, + "args": { + "External id": 449122,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008102337.357, "dur": 9.254, + "args": { + "External id": 449123,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008102341.339, "dur": 4.845, + "args": { + "External id": 449124,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102344.581, "dur": 0.489, + "args": { + "External id": 449125,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008102353.073, "dur": 23.607, + "args": { + "External id": 449126,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102354.558, "dur": 0.435, + "args": { + "External id": 449127,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102357.747, "dur": 0.534, + "args": { + "External id": 449128,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102359.488, "dur": 1.959, + "args": { + "External id": 449129,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102362.512, "dur": 0.314, + "args": { + "External id": 449130,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102365.155, "dur": 0.264, + "args": { + "External id": 449131,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102366.452, "dur": 0.580, + "args": { + "External id": 449132,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102368.479, "dur": 1.268, + "args": { + "External id": 449133,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102370.947, "dur": 0.393, + "args": { + "External id": 449134,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008102372.619, "dur": 0.559, + "args": { + "External id": 449135,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008102387.232, "dur": 17.686, + "args": { + "External id": 449136,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008102454.048, "dur": 109.844, + "args": { + "External id": 449137,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008102478.487, "dur": 81.915, + "args": { + "External id": 449138,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2673, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008102487.760, "dur": 68.344, + "args": { + "External id": 449139,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008102578.355, "dur": 1.862, + "args": { + "External id": 449140,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2675, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008102688.083, "dur": 1577.296, + "args": { + "External id": 449141,"Sequence number": 5285414, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2676 + } + }, + { + "ph": "f", "id": 186, "pid": 4183441, "tid": 31362, "ts": 676008102688.083, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008102803.283, "dur": 98.917, + "args": { + "External id": 449142,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008102944.323, "dur": 37.057, + "args": { + "External id": 449143,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008102998.909, "dur": 38.462, + "args": { + "External id": 449144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103048.374, "dur": 26.739, + "args": { + "External id": 449145,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103081.037, "dur": 54.822, + "args": { + "External id": 449146,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103145.545, "dur": 20.736, + "args": { + "External id": 449147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103173.828, "dur": 29.921, + "args": { + "External id": 449148,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008103231.511, "dur": 22.997, + "args": { + "External id": 449149,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008103273.189, "dur": 26.136, + "args": { + "External id": 449150,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008103319.300, "dur": 17.715, + "args": { + "External id": 449151,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008103351.199, "dur": 13.728, + "args": { + "External id": 449152,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103373.592, "dur": 35.645, + "args": { + "External id": 449153,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103412.552, "dur": 33.856, + "args": { + "External id": 449154,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008103474.559, "dur": 163.468, + "args": { + "External id": 449155,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008103550.973, "dur": 5.953, + "args": { + "External id": 449156,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008103558.608, "dur": 2.928, + "args": { + "External id": 449157,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008103724.282, "dur": 28.842, + "args": { + "External id": 449158,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008103766.033, "dur": 13.619, + "args": { + "External id": 449159,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103789.336, "dur": 52.673, + "args": { + "External id": 449160,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103847.901, "dur": 32.868, + "args": { + "External id": 449161,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103889.428, "dur": 28.487, + "args": { + "External id": 449162,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103922.453, "dur": 28.434, + "args": { + "External id": 449163,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103956.368, "dur": 28.009, + "args": { + "External id": 449164,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008103991.075, "dur": 41.216, + "args": { + "External id": 449165,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008104058.815, "dur": 41.813, + "args": { + "External id": 449166,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008104121.946, "dur": 29.035, + "args": { + "External id": 449167,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008104165.890, "dur": 16.606, + "args": { + "External id": 449168,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008104195.965, "dur": 15.800, + "args": { + "External id": 449169,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008104223.456, "dur": 14.405, + "args": { + "External id": 449170,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104307.762, "dur": 15.431, + "args": { + "External id": 449171,"Record function id": 0, "Ev Idx": 2706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104311.131, "dur": 11.182, + "args": { + "External id": 449172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104315.149, "dur": 6.359, + "args": { + "External id": 449173,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104316.516, "dur": 4.888, + "args": { + "External id": 449174,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104327.120, "dur": 6.400, + "args": { + "External id": 449175,"Record function id": 0, "Ev Idx": 2710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104328.580, "dur": 4.481, + "args": { + "External id": 449176,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104329.753, "dur": 2.868, + "args": { + "External id": 449177,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104330.235, "dur": 2.222, + "args": { + "External id": 449178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104337.065, "dur": 4.963, + "args": { + "External id": 449179,"Record function id": 0, "Ev Idx": 2714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104338.409, "dur": 3.198, + "args": { + "External id": 449180,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104339.250, "dur": 1.732, + "args": { + "External id": 449181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104340.020, "dur": 0.900, + "args": { + "External id": 449182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104345.274, "dur": 4.843, + "args": { + "External id": 449183,"Record function id": 0, "Ev Idx": 2718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104346.632, "dur": 3.108, + "args": { + "External id": 449184,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104347.519, "dur": 1.707, + "args": { + "External id": 449185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104348.165, "dur": 0.983, + "args": { + "External id": 449186,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104353.213, "dur": 4.629, + "args": { + "External id": 449187,"Record function id": 0, "Ev Idx": 2722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104354.361, "dur": 3.098, + "args": { + "External id": 449188,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104355.446, "dur": 1.503, + "args": { + "External id": 449189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104356.151, "dur": 0.733, + "args": { + "External id": 449190,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104360.968, "dur": 3.536, + "args": { + "External id": 449191,"Record function id": 0, "Ev Idx": 2726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104361.972, "dur": 2.106, + "args": { + "External id": 449192,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104362.612, "dur": 1.027, + "args": { + "External id": 449193,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104363.026, "dur": 0.548, + "args": { + "External id": 449194,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104367.758, "dur": 4.184, + "args": { + "External id": 449195,"Record function id": 0, "Ev Idx": 2730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104369.048, "dur": 2.485, + "args": { + "External id": 449196,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104369.515, "dur": 1.387, + "args": { + "External id": 449197,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104370.239, "dur": 0.598, + "args": { + "External id": 449198,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104375.377, "dur": 4.354, + "args": { + "External id": 449199,"Record function id": 0, "Ev Idx": 2734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104376.573, "dur": 2.746, + "args": { + "External id": 449200,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104377.485, "dur": 1.461, + "args": { + "External id": 449201,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104378.212, "dur": 0.668, + "args": { + "External id": 449202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104382.882, "dur": 5.918, + "args": { + "External id": 449203,"Record function id": 0, "Ev Idx": 2738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008104384.095, "dur": 4.314, + "args": { + "External id": 449204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008104384.822, "dur": 3.207, + "args": { + "External id": 449205,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008104385.449, "dur": 2.512, + "args": { + "External id": 449206,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008104392.366, "dur": 16127.541, + "args": { + "External id": 449207,"Record function id": 0, "Sequence number": 5285413, "Fwd thread id": 1, "Ev Idx": 2742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008104393.775, "dur": 16117.600, + "args": { + "External id": 449208,"Sequence number": 5285413, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2743 + } + }, + { + "ph": "f", "id": 187, "pid": 4183441, "tid": 31362, "ts": 676008104393.775, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008104423.369, "dur": 37.495, + "args": { + "External id": 449209,"Record function id": 0, "Ev Idx": 2744 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008104468.263, "dur": 71.171, + "args": { + "External id": 449210,"Record function id": 0, "Ev Idx": 2745 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.12)", "pid": 4183441, "tid": 31362, + "ts": 676008104546.008, "dur": 15958.572, + "args": { + "External id": 449211,"Record function id": 0, "Ev Idx": 2746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008104633.484, "dur": 6.622, + "args": { + "External id": 449212,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008104649.203, "dur": 4.813, + "args": { + "External id": 449213,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008104705.375, "dur": 15150.006, + "args": { + "External id": 449214,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008104719.189, "dur": 15128.519, + "args": { + "External id": 449215,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008104748.250, "dur": 14.448, + "args": { + "External id": 449216,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008104767.688, "dur": 15046.556, + "args": { + "External id": 449217,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008104770.514, "dur": 15043.031, + "args": { + "External id": 449218,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008104774.856, "dur": 6.751, + "args": { + "External id": 449219,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008104783.414, "dur": 15027.032, + "args": { + "External id": 449220,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008119937.875, "dur": 8.699, + "args": { + "External id": 449221,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008119940.624, "dur": 5.541, + "args": { + "External id": 449222,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008119973.024, "dur": 269.111, + "args": { + "External id": 449223,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008119998.948, "dur": 238.714, + "args": { + "External id": 449224,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2759, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008120011.129, "dur": 221.483, + "args": { + "External id": 449225,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008120259.632, "dur": 2.353, + "args": { + "External id": 449226,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2761, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120313.790, "dur": 5.921, + "args": { + "External id": 449227,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120360.482, "dur": 3.419, + "args": { + "External id": 449228,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120379.614, "dur": 1.301, + "args": { + "External id": 449229,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120392.479, "dur": 0.678, + "args": { + "External id": 449230,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120403.012, "dur": 1.007, + "args": { + "External id": 449231,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120413.773, "dur": 2.593, + "args": { + "External id": 449232,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120426.623, "dur": 0.864, + "args": { + "External id": 449233,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120437.626, "dur": 2.070, + "args": { + "External id": 449234,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120449.322, "dur": 0.759, + "args": { + "External id": 449235,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008120533.850, "dur": 2625.697, + "args": { + "External id": 449236,"Record function id": 0, "Ev Idx": 2771 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008120552.860, "dur": 973.246, + "args": { + "External id": 449237,"Record function id": 0, "Ev Idx": 2772 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008120567.114, "dur": 332.189, + "args": { + "External id": 449238,"Record function id": 0, "Ev Idx": 2773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120645.863, "dur": 5.302, + "args": { + "External id": 449239,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120691.643, "dur": 1.973, + "args": { + "External id": 449240,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120695.639, "dur": 1.000, + "args": { + "External id": 449241,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120698.316, "dur": 1.247, + "args": { + "External id": 449242,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120701.121, "dur": 0.956, + "args": { + "External id": 449243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120705.114, "dur": 0.861, + "args": { + "External id": 449244,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120707.578, "dur": 1.467, + "args": { + "External id": 449245,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120710.501, "dur": 0.858, + "args": { + "External id": 449246,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120712.779, "dur": 2.642, + "args": { + "External id": 449247,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008120716.845, "dur": 0.919, + "args": { + "External id": 449248,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008120735.066, "dur": 136.041, + "args": { + "External id": 449249,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008120751.098, "dur": 115.786, + "args": { + "External id": 449250,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008120763.351, "dur": 12.623, + "args": { + "External id": 449251,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008120778.563, "dur": 61.156, + "args": { + "External id": 449252,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008120781.175, "dur": 58.241, + "args": { + "External id": 449253,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008120785.984, "dur": 5.559, + "args": { + "External id": 449254,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008120793.229, "dur": 45.440, + "args": { + "External id": 449255,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2790 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.10", "pid": 4183441, "tid": 31362, + "ts": 676008120986.057, "dur": 532.651, + "args": { + "External id": 449256,"Record function id": 0, "Ev Idx": 2791 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008121003.857, "dur": 503.106, + "args": { + "External id": 449257,"Record function id": 0, "Ev Idx": 2792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008121063.636, "dur": 5.143, + "args": { + "External id": 449258,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008121102.144, "dur": 26.055, + "args": { + "External id": 449259,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121106.132, "dur": 1.799, + "args": { + "External id": 449260,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121109.798, "dur": 0.563, + "args": { + "External id": 449261,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121112.751, "dur": 0.458, + "args": { + "External id": 449262,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121114.299, "dur": 1.972, + "args": { + "External id": 449263,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121116.913, "dur": 0.265, + "args": { + "External id": 449264,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121118.844, "dur": 0.603, + "args": { + "External id": 449265,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121120.390, "dur": 0.481, + "args": { + "External id": 449266,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121121.710, "dur": 1.277, + "args": { + "External id": 449267,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121123.998, "dur": 0.344, + "args": { + "External id": 449268,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008121142.052, "dur": 31.374, + "args": { + "External id": 449269,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008121203.902, "dur": 91.833, + "args": { + "External id": 449270,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008121213.172, "dur": 4.599, + "args": { + "External id": 449271,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008121223.047, "dur": 9.119, + "args": { + "External id": 449272,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008121227.022, "dur": 4.747, + "args": { + "External id": 449273,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121229.874, "dur": 0.600, + "args": { + "External id": 449274,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008121238.815, "dur": 21.855, + "args": { + "External id": 449275,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121240.256, "dur": 2.359, + "args": { + "External id": 449276,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121243.660, "dur": 1.536, + "args": { + "External id": 449277,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121246.036, "dur": 0.388, + "args": { + "External id": 449278,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121247.269, "dur": 0.472, + "args": { + "External id": 449279,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121249.648, "dur": 0.655, + "args": { + "External id": 449280,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121250.948, "dur": 0.527, + "args": { + "External id": 449281,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121252.252, "dur": 0.578, + "args": { + "External id": 449282,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121254.536, "dur": 0.278, + "args": { + "External id": 449283,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008121255.383, "dur": 2.086, + "args": { + "External id": 449284,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008121269.713, "dur": 19.028, + "args": { + "External id": 449285,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008121338.391, "dur": 106.960, + "args": { + "External id": 449286,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008121361.669, "dur": 80.427, + "args": { + "External id": 449287,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2822, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008121371.052, "dur": 67.253, + "args": { + "External id": 449288,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008121459.997, "dur": 1.795, + "args": { + "External id": 449289,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2824, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008121532.304, "dur": 1600.675, + "args": { + "External id": 449290,"Sequence number": 5285412, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2825 + } + }, + { + "ph": "f", "id": 188, "pid": 4183441, "tid": 31362, "ts": 676008121532.304, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008121638.527, "dur": 139.357, + "args": { + "External id": 449291,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008121822.000, "dur": 38.877, + "args": { + "External id": 449292,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008121879.953, "dur": 41.726, + "args": { + "External id": 449293,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008121930.601, "dur": 27.931, + "args": { + "External id": 449294,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008121964.960, "dur": 38.537, + "args": { + "External id": 449295,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122009.406, "dur": 20.295, + "args": { + "External id": 449296,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122038.820, "dur": 30.095, + "args": { + "External id": 449297,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008122110.358, "dur": 24.066, + "args": { + "External id": 449298,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008122151.538, "dur": 26.498, + "args": { + "External id": 449299,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008122198.996, "dur": 17.274, + "args": { + "External id": 449300,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008122228.911, "dur": 15.234, + "args": { + "External id": 449301,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122253.388, "dur": 39.664, + "args": { + "External id": 449302,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122296.401, "dur": 35.135, + "args": { + "External id": 449303,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008122362.163, "dur": 160.960, + "args": { + "External id": 449304,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008122436.635, "dur": 6.020, + "args": { + "External id": 449305,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008122444.519, "dur": 2.996, + "args": { + "External id": 449306,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008122554.182, "dur": 23.518, + "args": { + "External id": 449307,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008122588.622, "dur": 13.254, + "args": { + "External id": 449308,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122609.467, "dur": 40.084, + "args": { + "External id": 449309,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122698.198, "dur": 36.957, + "args": { + "External id": 449310,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122743.409, "dur": 30.846, + "args": { + "External id": 449311,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122778.455, "dur": 28.560, + "args": { + "External id": 449312,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122815.867, "dur": 26.813, + "args": { + "External id": 449313,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008122851.934, "dur": 30.139, + "args": { + "External id": 449314,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008122901.178, "dur": 21.679, + "args": { + "External id": 449315,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008122942.647, "dur": 22.136, + "args": { + "External id": 449316,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008122980.894, "dur": 20.274, + "args": { + "External id": 449317,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008123014.826, "dur": 27.307, + "args": { + "External id": 449318,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008123062.799, "dur": 39.831, + "args": { + "External id": 449319,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 2854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123181.435, "dur": 20.001, + "args": { + "External id": 449320,"Record function id": 0, "Ev Idx": 2855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123184.619, "dur": 16.018, + "args": { + "External id": 449321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123188.851, "dur": 10.900, + "args": { + "External id": 449322,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123190.786, "dur": 8.881, + "args": { + "External id": 449323,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123205.198, "dur": 4.673, + "args": { + "External id": 449324,"Record function id": 0, "Ev Idx": 2859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123206.717, "dur": 2.737, + "args": { + "External id": 449325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123207.738, "dur": 1.256, + "args": { + "External id": 449326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123208.236, "dur": 0.692, + "args": { + "External id": 449327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123213.061, "dur": 4.903, + "args": { + "External id": 449328,"Record function id": 0, "Ev Idx": 2863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123214.463, "dur": 3.071, + "args": { + "External id": 449329,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123215.400, "dur": 1.689, + "args": { + "External id": 449330,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123216.146, "dur": 0.859, + "args": { + "External id": 449331,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 2866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123221.143, "dur": 4.731, + "args": { + "External id": 449332,"Record function id": 0, "Ev Idx": 2867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123222.427, "dur": 3.032, + "args": { + "External id": 449333,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123223.476, "dur": 1.569, + "args": { + "External id": 449334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123224.169, "dur": 0.798, + "args": { + "External id": 449335,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 2870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123229.338, "dur": 4.549, + "args": { + "External id": 449336,"Record function id": 0, "Ev Idx": 2871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123230.494, "dur": 2.934, + "args": { + "External id": 449337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123231.370, "dur": 1.638, + "args": { + "External id": 449338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123232.172, "dur": 0.769, + "args": { + "External id": 449339,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123237.054, "dur": 3.891, + "args": { + "External id": 449340,"Record function id": 0, "Ev Idx": 2875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123238.403, "dur": 2.116, + "args": { + "External id": 449341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123238.980, "dur": 1.134, + "args": { + "External id": 449342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123239.340, "dur": 0.677, + "args": { + "External id": 449343,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123244.048, "dur": 4.539, + "args": { + "External id": 449344,"Record function id": 0, "Ev Idx": 2879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123245.624, "dur": 2.531, + "args": { + "External id": 449345,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123246.511, "dur": 1.187, + "args": { + "External id": 449346,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123246.989, "dur": 0.644, + "args": { + "External id": 449347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123251.797, "dur": 8.770, + "args": { + "External id": 449348,"Record function id": 0, "Ev Idx": 2883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123252.949, "dur": 7.180, + "args": { + "External id": 449349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123253.591, "dur": 6.121, + "args": { + "External id": 449350,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123254.058, "dur": 5.576, + "args": { + "External id": 449351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 2886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123263.907, "dur": 3.988, + "args": { + "External id": 449352,"Record function id": 0, "Ev Idx": 2887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008123264.820, "dur": 2.669, + "args": { + "External id": 449353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008123265.320, "dur": 1.636, + "args": { + "External id": 449354,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008123265.945, "dur": 0.949, + "args": { + "External id": 449355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 2890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008123271.717, "dur": 14942.990, + "args": { + "External id": 449356,"Record function id": 0, "Sequence number": 5285411, "Fwd thread id": 1, "Ev Idx": 2891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008123272.889, "dur": 14933.044, + "args": { + "External id": 449357,"Sequence number": 5285411, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2892 + } + }, + { + "ph": "f", "id": 189, "pid": 4183441, "tid": 31362, "ts": 676008123272.889, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008123301.012, "dur": 38.805, + "args": { + "External id": 449358,"Record function id": 0, "Ev Idx": 2893 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008123346.700, "dur": 68.032, + "args": { + "External id": 449359,"Record function id": 0, "Ev Idx": 2894 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.11)", "pid": 4183441, "tid": 31362, + "ts": 676008123420.931, "dur": 14776.899, + "args": { + "External id": 449360,"Record function id": 0, "Ev Idx": 2895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008123509.921, "dur": 7.160, + "args": { + "External id": 449361,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008123526.050, "dur": 4.468, + "args": { + "External id": 449362,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008123543.552, "dur": 13960.475, + "args": { + "External id": 449363,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008123556.266, "dur": 13938.067, + "args": { + "External id": 449364,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 2899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008123575.760, "dur": 12.915, + "args": { + "External id": 449365,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008123593.163, "dur": 13864.697, + "args": { + "External id": 449366,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 2901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008123595.461, "dur": 13861.638, + "args": { + "External id": 449367,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 2902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008123599.011, "dur": 6.493, + "args": { + "External id": 449368,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008123607.262, "dur": 13846.146, + "args": { + "External id": 449369,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 2904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008137593.348, "dur": 9.885, + "args": { + "External id": 449370,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 2905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008137596.408, "dur": 6.487, + "args": { + "External id": 449371,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008137629.916, "dur": 279.777, + "args": { + "External id": 449372,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 2907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008137680.914, "dur": 223.852, + "args": { + "External id": 449373,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2908, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008137694.043, "dur": 205.697, + "args": { + "External id": 449374,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 2909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008137926.295, "dur": 2.362, + "args": { + "External id": 449375,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2910, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008137979.935, "dur": 6.656, + "args": { + "External id": 449376,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138029.312, "dur": 1.373, + "args": { + "External id": 449377,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138045.774, "dur": 1.347, + "args": { + "External id": 449378,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138058.159, "dur": 0.865, + "args": { + "External id": 449379,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138070.010, "dur": 0.833, + "args": { + "External id": 449380,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138098.022, "dur": 1.389, + "args": { + "External id": 449381,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138113.964, "dur": 0.821, + "args": { + "External id": 449382,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138125.360, "dur": 2.444, + "args": { + "External id": 449383,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138137.632, "dur": 1.234, + "args": { + "External id": 449384,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008138229.617, "dur": 2628.900, + "args": { + "External id": 449385,"Record function id": 0, "Ev Idx": 2920 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008138247.710, "dur": 989.148, + "args": { + "External id": 449386,"Record function id": 0, "Ev Idx": 2921 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008138261.114, "dur": 284.469, + "args": { + "External id": 449387,"Record function id": 0, "Ev Idx": 2922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138340.572, "dur": 3.762, + "args": { + "External id": 449388,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 2923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138347.602, "dur": 1.029, + "args": { + "External id": 449389,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138350.312, "dur": 0.973, + "args": { + "External id": 449390,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138353.299, "dur": 0.733, + "args": { + "External id": 449391,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138355.231, "dur": 1.276, + "args": { + "External id": 449392,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138357.816, "dur": 0.993, + "args": { + "External id": 449393,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 2928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138360.460, "dur": 1.414, + "args": { + "External id": 449394,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 2929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138363.433, "dur": 2.192, + "args": { + "External id": 449395,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138367.130, "dur": 0.933, + "args": { + "External id": 449396,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008138369.729, "dur": 0.650, + "args": { + "External id": 449397,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 2932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008138387.465, "dur": 133.795, + "args": { + "External id": 449398,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008138402.140, "dur": 114.814, + "args": { + "External id": 449399,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 2934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008138414.572, "dur": 11.977, + "args": { + "External id": 449400,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008138429.390, "dur": 60.949, + "args": { + "External id": 449401,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 2936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008138432.188, "dur": 57.811, + "args": { + "External id": 449402,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 2937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138437.052, "dur": 6.114, + "args": { + "External id": 449403,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008138444.853, "dur": 44.642, + "args": { + "External id": 449404,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 2939 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.9", "pid": 4183441, "tid": 31362, + "ts": 676008138626.966, "dur": 602.677, + "args": { + "External id": 449405,"Record function id": 0, "Ev Idx": 2940 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008138642.421, "dur": 575.653, + "args": { + "External id": 449406,"Record function id": 0, "Ev Idx": 2941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008138743.929, "dur": 7.289, + "args": { + "External id": 449407,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008138765.351, "dur": 30.591, + "args": { + "External id": 449408,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138769.785, "dur": 1.462, + "args": { + "External id": 449409,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138773.063, "dur": 1.689, + "args": { + "External id": 449410,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138776.320, "dur": 2.339, + "args": { + "External id": 449411,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138779.444, "dur": 0.478, + "args": { + "External id": 449412,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138782.194, "dur": 0.335, + "args": { + "External id": 449413,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138784.041, "dur": 0.455, + "args": { + "External id": 449414,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138787.463, "dur": 0.561, + "args": { + "External id": 449415,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138789.863, "dur": 0.378, + "args": { + "External id": 449416,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138791.043, "dur": 0.570, + "args": { + "External id": 449417,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008138805.608, "dur": 33.168, + "args": { + "External id": 449418,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008138872.857, "dur": 106.262, + "args": { + "External id": 449419,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 2954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008138882.234, "dur": 5.016, + "args": { + "External id": 449420,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008138892.133, "dur": 11.779, + "args": { + "External id": 449421,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008138896.494, "dur": 7.005, + "args": { + "External id": 449422,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 2957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138899.798, "dur": 2.436, + "args": { + "External id": 449423,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 2958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008138910.541, "dur": 28.039, + "args": { + "External id": 449424,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 2959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138912.469, "dur": 0.561, + "args": { + "External id": 449425,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138914.708, "dur": 1.501, + "args": { + "External id": 449426,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138917.297, "dur": 0.430, + "args": { + "External id": 449427,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138922.209, "dur": 0.572, + "args": { + "External id": 449428,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138924.615, "dur": 0.356, + "args": { + "External id": 449429,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138926.378, "dur": 0.461, + "args": { + "External id": 449430,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138928.105, "dur": 0.480, + "args": { + "External id": 449431,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138930.697, "dur": 2.590, + "args": { + "External id": 449432,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008138934.405, "dur": 0.802, + "args": { + "External id": 449433,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 2968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008138951.986, "dur": 19.708, + "args": { + "External id": 449434,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 2969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008139022.539, "dur": 125.635, + "args": { + "External id": 449435,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 2970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008139044.025, "dur": 100.009, + "args": { + "External id": 449436,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2971, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008139053.575, "dur": 85.884, + "args": { + "External id": 449437,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 2972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008139164.161, "dur": 2.085, + "args": { + "External id": 449438,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2973, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008139244.270, "dur": 1593.107, + "args": { + "External id": 449439,"Sequence number": 5285410, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 2974 + } + }, + { + "ph": "f", "id": 190, "pid": 4183441, "tid": 31362, "ts": 676008139244.270, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139353.416, "dur": 97.571, + "args": { + "External id": 449440,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 2975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008139487.378, "dur": 40.290, + "args": { + "External id": 449441,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 2976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008139546.632, "dur": 41.777, + "args": { + "External id": 449442,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 2977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139597.347, "dur": 28.133, + "args": { + "External id": 449443,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139631.724, "dur": 73.879, + "args": { + "External id": 449444,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139716.372, "dur": 23.862, + "args": { + "External id": 449445,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 2980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139749.449, "dur": 30.350, + "args": { + "External id": 449446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 2981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008139805.798, "dur": 24.484, + "args": { + "External id": 449447,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 2982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008139849.513, "dur": 24.867, + "args": { + "External id": 449448,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008139893.367, "dur": 17.757, + "args": { + "External id": 449449,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 2984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008139923.595, "dur": 13.120, + "args": { + "External id": 449450,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 2985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139946.855, "dur": 38.322, + "args": { + "External id": 449451,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008139988.499, "dur": 32.493, + "args": { + "External id": 449452,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008140047.438, "dur": 184.115, + "args": { + "External id": 449453,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008140138.455, "dur": 6.493, + "args": { + "External id": 449454,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008140147.302, "dur": 4.412, + "args": { + "External id": 449455,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008140264.754, "dur": 24.168, + "args": { + "External id": 449456,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008140300.189, "dur": 13.247, + "args": { + "External id": 449457,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140322.879, "dur": 51.212, + "args": { + "External id": 449458,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140379.362, "dur": 31.567, + "args": { + "External id": 449459,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140420.945, "dur": 27.829, + "args": { + "External id": 449460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140453.210, "dur": 28.602, + "args": { + "External id": 449461,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140489.227, "dur": 27.616, + "args": { + "External id": 449462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 2997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008140523.764, "dur": 28.462, + "args": { + "External id": 449463,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 2998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008140568.129, "dur": 22.092, + "args": { + "External id": 449464,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 2999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008140608.319, "dur": 77.255, + "args": { + "External id": 449465,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008140719.578, "dur": 20.771, + "args": { + "External id": 449466,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008140757.008, "dur": 17.246, + "args": { + "External id": 449467,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008140787.127, "dur": 15.748, + "args": { + "External id": 449468,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140880.091, "dur": 17.846, + "args": { + "External id": 449469,"Record function id": 0, "Ev Idx": 3004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140886.729, "dur": 10.350, + "args": { + "External id": 449470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140891.181, "dur": 5.076, + "args": { + "External id": 449471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140892.374, "dur": 3.796, + "args": { + "External id": 449472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140901.860, "dur": 5.301, + "args": { + "External id": 449473,"Record function id": 0, "Ev Idx": 3008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140903.576, "dur": 3.158, + "args": { + "External id": 449474,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140904.552, "dur": 1.707, + "args": { + "External id": 449475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140905.234, "dur": 0.932, + "args": { + "External id": 449476,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140910.548, "dur": 4.480, + "args": { + "External id": 449477,"Record function id": 0, "Ev Idx": 3012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140912.002, "dur": 2.628, + "args": { + "External id": 449478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140912.689, "dur": 1.401, + "args": { + "External id": 449479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140913.167, "dur": 0.820, + "args": { + "External id": 449480,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140918.095, "dur": 4.088, + "args": { + "External id": 449481,"Record function id": 0, "Ev Idx": 3016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140919.548, "dur": 2.192, + "args": { + "External id": 449482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140920.047, "dur": 1.311, + "args": { + "External id": 449483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140920.646, "dur": 0.621, + "args": { + "External id": 449484,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140925.157, "dur": 4.010, + "args": { + "External id": 449485,"Record function id": 0, "Ev Idx": 3020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140926.410, "dur": 2.363, + "args": { + "External id": 449486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140926.851, "dur": 1.395, + "args": { + "External id": 449487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140927.548, "dur": 0.606, + "args": { + "External id": 449488,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140932.397, "dur": 4.492, + "args": { + "External id": 449489,"Record function id": 0, "Ev Idx": 3024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140933.427, "dur": 3.044, + "args": { + "External id": 449490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140934.086, "dur": 1.862, + "args": { + "External id": 449491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140934.875, "dur": 0.981, + "args": { + "External id": 449492,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140942.893, "dur": 5.839, + "args": { + "External id": 449493,"Record function id": 0, "Ev Idx": 3028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140943.956, "dur": 4.353, + "args": { + "External id": 449494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140944.608, "dur": 3.319, + "args": { + "External id": 449495,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140945.485, "dur": 2.372, + "args": { + "External id": 449496,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140951.938, "dur": 4.646, + "args": { + "External id": 449497,"Record function id": 0, "Ev Idx": 3032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140953.241, "dur": 2.935, + "args": { + "External id": 449498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140953.708, "dur": 2.083, + "args": { + "External id": 449499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140954.521, "dur": 1.180, + "args": { + "External id": 449500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140959.895, "dur": 4.199, + "args": { + "External id": 449501,"Record function id": 0, "Ev Idx": 3036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008140961.168, "dur": 2.518, + "args": { + "External id": 449502,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008140962.005, "dur": 1.265, + "args": { + "External id": 449503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008140962.536, "dur": 0.642, + "args": { + "External id": 449504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008140968.345, "dur": 15061.807, + "args": { + "External id": 449505,"Record function id": 0, "Sequence number": 5285409, "Fwd thread id": 1, "Ev Idx": 3040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008140969.515, "dur": 15052.514, + "args": { + "External id": 449506,"Sequence number": 5285409, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3041 + } + }, + { + "ph": "f", "id": 191, "pid": 4183441, "tid": 31362, "ts": 676008140969.515, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008141000.823, "dur": 37.810, + "args": { + "External id": 449507,"Record function id": 0, "Ev Idx": 3042 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008141046.165, "dur": 92.976, + "args": { + "External id": 449508,"Record function id": 0, "Ev Idx": 3043 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.10)", "pid": 4183441, "tid": 31362, + "ts": 676008141146.274, "dur": 14868.339, + "args": { + "External id": 449509,"Record function id": 0, "Ev Idx": 3044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008141239.905, "dur": 6.595, + "args": { + "External id": 449510,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008141257.203, "dur": 4.740, + "args": { + "External id": 449511,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008141275.087, "dur": 14011.581, + "args": { + "External id": 449512,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008141295.995, "dur": 13982.936, + "args": { + "External id": 449513,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008141323.271, "dur": 13.835, + "args": { + "External id": 449514,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008141341.829, "dur": 13899.912, + "args": { + "External id": 449515,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008141344.314, "dur": 13896.696, + "args": { + "External id": 449516,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008141348.044, "dur": 5.491, + "args": { + "External id": 449517,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008141355.134, "dur": 13882.576, + "args": { + "External id": 449518,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008155371.065, "dur": 9.024, + "args": { + "External id": 449519,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008155373.977, "dur": 5.654, + "args": { + "External id": 449520,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008155406.064, "dur": 329.971, + "args": { + "External id": 449521,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008155435.658, "dur": 295.434, + "args": { + "External id": 449522,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3057, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008155448.307, "dur": 277.417, + "args": { + "External id": 449523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008155755.143, "dur": 2.283, + "args": { + "External id": 449524,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3059, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155813.654, "dur": 8.524, + "args": { + "External id": 449525,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155864.004, "dur": 1.487, + "args": { + "External id": 449526,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155881.223, "dur": 1.555, + "args": { + "External id": 449527,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155894.546, "dur": 1.289, + "args": { + "External id": 449528,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155906.666, "dur": 2.761, + "args": { + "External id": 449529,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155919.380, "dur": 0.860, + "args": { + "External id": 449530,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155930.756, "dur": 0.752, + "args": { + "External id": 449531,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155942.566, "dur": 1.669, + "args": { + "External id": 449532,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008155953.990, "dur": 2.678, + "args": { + "External id": 449533,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008156043.754, "dur": 2669.085, + "args": { + "External id": 449534,"Record function id": 0, "Ev Idx": 3069 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008156062.381, "dur": 1012.479, + "args": { + "External id": 449535,"Record function id": 0, "Ev Idx": 3070 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008156075.924, "dur": 333.540, + "args": { + "External id": 449536,"Record function id": 0, "Ev Idx": 3071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156192.963, "dur": 4.809, + "args": { + "External id": 449537,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156200.909, "dur": 3.992, + "args": { + "External id": 449538,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156206.486, "dur": 0.923, + "args": { + "External id": 449539,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156208.766, "dur": 0.757, + "args": { + "External id": 449540,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156210.855, "dur": 0.772, + "args": { + "External id": 449541,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156213.022, "dur": 0.846, + "args": { + "External id": 449542,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156215.345, "dur": 3.530, + "args": { + "External id": 449543,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156220.658, "dur": 0.880, + "args": { + "External id": 449544,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156223.193, "dur": 0.670, + "args": { + "External id": 449545,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008156225.876, "dur": 0.639, + "args": { + "External id": 449546,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008156243.848, "dur": 136.831, + "args": { + "External id": 449547,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008156258.507, "dur": 118.242, + "args": { + "External id": 449548,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008156271.992, "dur": 13.292, + "args": { + "External id": 449549,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008156288.071, "dur": 60.896, + "args": { + "External id": 449550,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008156290.634, "dur": 58.022, + "args": { + "External id": 449551,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156294.201, "dur": 5.732, + "args": { + "External id": 449552,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008156301.514, "dur": 46.606, + "args": { + "External id": 449553,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3088 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.8", "pid": 4183441, "tid": 31362, + "ts": 676008156497.969, "dur": 569.324, + "args": { + "External id": 449554,"Record function id": 0, "Ev Idx": 3089 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008156514.849, "dur": 540.207, + "args": { + "External id": 449555,"Record function id": 0, "Ev Idx": 3090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008156576.555, "dur": 4.249, + "args": { + "External id": 449556,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008156594.423, "dur": 26.521, + "args": { + "External id": 449557,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156599.497, "dur": 1.486, + "args": { + "External id": 449558,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156602.546, "dur": 2.498, + "args": { + "External id": 449559,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156606.564, "dur": 0.433, + "args": { + "External id": 449560,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156608.189, "dur": 0.321, + "args": { + "External id": 449561,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156610.941, "dur": 0.363, + "args": { + "External id": 449562,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156612.055, "dur": 0.284, + "args": { + "External id": 449563,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156613.556, "dur": 0.252, + "args": { + "External id": 449564,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156615.844, "dur": 0.248, + "args": { + "External id": 449565,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156617.166, "dur": 0.259, + "args": { + "External id": 449566,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008156630.484, "dur": 68.941, + "args": { + "External id": 449567,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008156733.220, "dur": 103.466, + "args": { + "External id": 449568,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008156743.430, "dur": 6.059, + "args": { + "External id": 449569,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008156754.413, "dur": 9.936, + "args": { + "External id": 449570,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008156758.458, "dur": 5.496, + "args": { + "External id": 449571,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156761.892, "dur": 0.625, + "args": { + "External id": 449572,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008156771.525, "dur": 23.512, + "args": { + "External id": 449573,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156773.124, "dur": 0.666, + "args": { + "External id": 449574,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156776.533, "dur": 0.496, + "args": { + "External id": 449575,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156777.967, "dur": 0.701, + "args": { + "External id": 449576,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156780.152, "dur": 1.415, + "args": { + "External id": 449577,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156782.522, "dur": 0.258, + "args": { + "External id": 449578,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156784.180, "dur": 0.336, + "args": { + "External id": 449579,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156787.314, "dur": 1.995, + "args": { + "External id": 449580,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156790.501, "dur": 0.383, + "args": { + "External id": 449581,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008156791.887, "dur": 0.326, + "args": { + "External id": 449582,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008156807.690, "dur": 21.898, + "args": { + "External id": 449583,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008156881.890, "dur": 109.908, + "args": { + "External id": 449584,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008156905.263, "dur": 83.113, + "args": { + "External id": 449585,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3120, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008156915.944, "dur": 68.233, + "args": { + "External id": 449586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008157006.312, "dur": 1.749, + "args": { + "External id": 449587,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3122, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008157097.649, "dur": 1594.651, + "args": { + "External id": 449588,"Sequence number": 5285408, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3123 + } + }, + { + "ph": "f", "id": 192, "pid": 4183441, "tid": 31362, "ts": 676008157097.649, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157209.112, "dur": 100.590, + "args": { + "External id": 449589,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008157347.403, "dur": 36.399, + "args": { + "External id": 449590,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008157401.073, "dur": 39.425, + "args": { + "External id": 449591,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157449.565, "dur": 26.787, + "args": { + "External id": 449592,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157481.873, "dur": 33.581, + "args": { + "External id": 449593,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157523.114, "dur": 20.092, + "args": { + "External id": 449594,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157550.712, "dur": 29.429, + "args": { + "External id": 449595,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008157602.052, "dur": 22.078, + "args": { + "External id": 449596,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008157641.202, "dur": 67.893, + "args": { + "External id": 449597,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008157733.195, "dur": 20.910, + "args": { + "External id": 449598,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008157765.579, "dur": 14.720, + "args": { + "External id": 449599,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157790.986, "dur": 42.467, + "args": { + "External id": 449600,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008157837.215, "dur": 31.095, + "args": { + "External id": 449601,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008157895.535, "dur": 171.584, + "args": { + "External id": 449602,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008157970.121, "dur": 6.066, + "args": { + "External id": 449603,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008157978.054, "dur": 9.186, + "args": { + "External id": 449604,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008158119.904, "dur": 29.960, + "args": { + "External id": 449605,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008158165.683, "dur": 15.982, + "args": { + "External id": 449606,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158190.262, "dur": 51.010, + "args": { + "External id": 449607,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158246.784, "dur": 32.664, + "args": { + "External id": 449608,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158286.040, "dur": 32.333, + "args": { + "External id": 449609,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158324.340, "dur": 28.835, + "args": { + "External id": 449610,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158359.162, "dur": 30.416, + "args": { + "External id": 449611,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008158396.308, "dur": 31.177, + "args": { + "External id": 449612,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008158458.229, "dur": 27.347, + "args": { + "External id": 449613,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008158503.978, "dur": 25.733, + "args": { + "External id": 449614,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008158544.169, "dur": 20.373, + "args": { + "External id": 449615,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008158580.826, "dur": 15.701, + "args": { + "External id": 449616,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008158613.337, "dur": 16.088, + "args": { + "External id": 449617,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158734.677, "dur": 17.957, + "args": { + "External id": 449618,"Record function id": 0, "Ev Idx": 3153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158741.233, "dur": 10.559, + "args": { + "External id": 449619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158745.196, "dur": 5.720, + "args": { + "External id": 449620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158746.686, "dur": 4.117, + "args": { + "External id": 449621,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158756.438, "dur": 4.713, + "args": { + "External id": 449622,"Record function id": 0, "Ev Idx": 3157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158757.849, "dur": 2.872, + "args": { + "External id": 449623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158758.843, "dur": 1.380, + "args": { + "External id": 449624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158759.281, "dur": 0.877, + "args": { + "External id": 449625,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158764.342, "dur": 3.770, + "args": { + "External id": 449626,"Record function id": 0, "Ev Idx": 3161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158765.277, "dur": 2.441, + "args": { + "External id": 449627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158765.876, "dur": 1.390, + "args": { + "External id": 449628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158766.308, "dur": 0.874, + "args": { + "External id": 449629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158771.168, "dur": 5.649, + "args": { + "External id": 449630,"Record function id": 0, "Ev Idx": 3165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158772.190, "dur": 4.250, + "args": { + "External id": 449631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158772.801, "dur": 3.233, + "args": { + "External id": 449632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158773.610, "dur": 2.357, + "args": { + "External id": 449633,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158779.914, "dur": 4.310, + "args": { + "External id": 449634,"Record function id": 0, "Ev Idx": 3169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158781.323, "dur": 2.520, + "args": { + "External id": 449635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158781.932, "dur": 1.510, + "args": { + "External id": 449636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158782.555, "dur": 0.820, + "args": { + "External id": 449637,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158787.307, "dur": 4.022, + "args": { + "External id": 449638,"Record function id": 0, "Ev Idx": 3173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158788.678, "dur": 2.256, + "args": { + "External id": 449639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158789.114, "dur": 1.383, + "args": { + "External id": 449640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158789.817, "dur": 0.616, + "args": { + "External id": 449641,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158797.649, "dur": 3.607, + "args": { + "External id": 449642,"Record function id": 0, "Ev Idx": 3177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158798.780, "dur": 2.085, + "args": { + "External id": 449643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158799.230, "dur": 1.203, + "args": { + "External id": 449644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158799.811, "dur": 0.557, + "args": { + "External id": 449645,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158804.327, "dur": 3.744, + "args": { + "External id": 449646,"Record function id": 0, "Ev Idx": 3181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158805.472, "dur": 2.225, + "args": { + "External id": 449647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158805.969, "dur": 1.317, + "args": { + "External id": 449648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158806.539, "dur": 0.681, + "args": { + "External id": 449649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158811.213, "dur": 3.401, + "args": { + "External id": 449650,"Record function id": 0, "Ev Idx": 3185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008158812.100, "dur": 2.145, + "args": { + "External id": 449651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008158812.568, "dur": 1.245, + "args": { + "External id": 449652,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008158813.081, "dur": 0.667, + "args": { + "External id": 449653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008158818.458, "dur": 14692.972, + "args": { + "External id": 449654,"Record function id": 0, "Sequence number": 5285407, "Fwd thread id": 1, "Ev Idx": 3189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008158819.966, "dur": 14683.237, + "args": { + "External id": 449655,"Sequence number": 5285407, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3190 + } + }, + { + "ph": "f", "id": 193, "pid": 4183441, "tid": 31362, "ts": 676008158819.966, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008158849.338, "dur": 40.252, + "args": { + "External id": 449656,"Record function id": 0, "Ev Idx": 3191 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008158896.901, "dur": 76.725, + "args": { + "External id": 449657,"Record function id": 0, "Ev Idx": 3192 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.9)", "pid": 4183441, "tid": 31362, + "ts": 676008158980.034, "dur": 14515.782, + "args": { + "External id": 449658,"Record function id": 0, "Ev Idx": 3193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008159064.084, "dur": 6.386, + "args": { + "External id": 449659,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008159079.590, "dur": 19.966, + "args": { + "External id": 449660,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008159116.165, "dur": 13747.321, + "args": { + "External id": 449661,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008159129.948, "dur": 13725.782, + "args": { + "External id": 449662,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008159153.363, "dur": 15.996, + "args": { + "External id": 449663,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008159173.880, "dur": 13647.791, + "args": { + "External id": 449664,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008159176.197, "dur": 13644.791, + "args": { + "External id": 449665,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008159180.272, "dur": 4.908, + "args": { + "External id": 449666,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008159186.682, "dur": 13630.858, + "args": { + "External id": 449667,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008172944.337, "dur": 8.721, + "args": { + "External id": 449668,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008172947.161, "dur": 5.546, + "args": { + "External id": 449669,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008172979.666, "dur": 254.586, + "args": { + "External id": 449670,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008173005.412, "dur": 224.241, + "args": { + "External id": 449671,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3206, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008173017.494, "dur": 207.094, + "args": { + "External id": 449672,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008173251.675, "dur": 2.195, + "args": { + "External id": 449673,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3208, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173304.374, "dur": 6.020, + "args": { + "External id": 449674,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173350.818, "dur": 1.414, + "args": { + "External id": 449675,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173366.630, "dur": 1.297, + "args": { + "External id": 449676,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173381.360, "dur": 0.820, + "args": { + "External id": 449677,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173392.763, "dur": 0.941, + "args": { + "External id": 449678,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173402.850, "dur": 0.717, + "args": { + "External id": 449679,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173413.312, "dur": 1.079, + "args": { + "External id": 449680,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173427.549, "dur": 1.858, + "args": { + "External id": 449681,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173438.699, "dur": 1.000, + "args": { + "External id": 449682,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008173525.363, "dur": 2607.208, + "args": { + "External id": 449683,"Record function id": 0, "Ev Idx": 3218 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008173543.648, "dur": 961.885, + "args": { + "External id": 449684,"Record function id": 0, "Ev Idx": 3219 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008173556.694, "dur": 328.787, + "args": { + "External id": 449685,"Record function id": 0, "Ev Idx": 3220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173635.895, "dur": 3.974, + "args": { + "External id": 449686,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173642.867, "dur": 0.982, + "args": { + "External id": 449687,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173645.988, "dur": 1.101, + "args": { + "External id": 449688,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173648.587, "dur": 3.049, + "args": { + "External id": 449689,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173688.682, "dur": 1.505, + "args": { + "External id": 449690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173692.432, "dur": 0.748, + "args": { + "External id": 449691,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173694.891, "dur": 1.652, + "args": { + "External id": 449692,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173698.064, "dur": 0.929, + "args": { + "External id": 449693,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173700.734, "dur": 0.819, + "args": { + "External id": 449694,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008173702.849, "dur": 1.069, + "args": { + "External id": 449695,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008173721.400, "dur": 136.730, + "args": { + "External id": 449696,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008173737.573, "dur": 116.747, + "args": { + "External id": 449697,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008173750.244, "dur": 13.213, + "args": { + "External id": 449698,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008173766.394, "dur": 61.019, + "args": { + "External id": 449699,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008173768.898, "dur": 58.134, + "args": { + "External id": 449700,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008173772.657, "dur": 7.462, + "args": { + "External id": 449701,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008173781.835, "dur": 44.634, + "args": { + "External id": 449702,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3237 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.7", "pid": 4183441, "tid": 31362, + "ts": 676008173970.129, "dur": 527.743, + "args": { + "External id": 449703,"Record function id": 0, "Ev Idx": 3238 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008173987.095, "dur": 499.321, + "args": { + "External id": 449704,"Record function id": 0, "Ev Idx": 3239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008174045.729, "dur": 3.795, + "args": { + "External id": 449705,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008174064.076, "dur": 47.555, + "args": { + "External id": 449706,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174072.144, "dur": 1.826, + "args": { + "External id": 449707,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174075.528, "dur": 0.354, + "args": { + "External id": 449708,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174077.055, "dur": 0.533, + "args": { + "External id": 449709,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174079.756, "dur": 0.411, + "args": { + "External id": 449710,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174095.870, "dur": 0.668, + "args": { + "External id": 449711,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174098.475, "dur": 0.622, + "args": { + "External id": 449712,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174101.876, "dur": 2.113, + "args": { + "External id": 449713,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174105.095, "dur": 0.364, + "args": { + "External id": 449714,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174106.753, "dur": 0.882, + "args": { + "External id": 449715,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008174122.661, "dur": 35.236, + "args": { + "External id": 449716,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008174189.904, "dur": 93.127, + "args": { + "External id": 449717,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008174199.559, "dur": 3.989, + "args": { + "External id": 449718,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008174209.283, "dur": 9.410, + "args": { + "External id": 449719,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008174213.454, "dur": 4.851, + "args": { + "External id": 449720,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174216.505, "dur": 0.567, + "args": { + "External id": 449721,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008174225.320, "dur": 20.498, + "args": { + "External id": 449722,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174227.291, "dur": 0.425, + "args": { + "External id": 449723,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174229.170, "dur": 0.368, + "args": { + "External id": 449724,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174230.620, "dur": 1.097, + "args": { + "External id": 449725,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174232.610, "dur": 2.516, + "args": { + "External id": 449726,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174235.913, "dur": 0.343, + "args": { + "External id": 449727,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174238.153, "dur": 0.387, + "args": { + "External id": 449728,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174239.266, "dur": 0.523, + "args": { + "External id": 449729,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174241.000, "dur": 0.367, + "args": { + "External id": 449730,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008174242.463, "dur": 0.330, + "args": { + "External id": 449731,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008174256.074, "dur": 19.865, + "args": { + "External id": 449732,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008174326.711, "dur": 100.510, + "args": { + "External id": 449733,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008174346.281, "dur": 77.602, + "args": { + "External id": 449734,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3269, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008174355.327, "dur": 64.765, + "args": { + "External id": 449735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008174440.224, "dur": 1.621, + "args": { + "External id": 449736,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3271, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008174512.352, "dur": 1597.289, + "args": { + "External id": 449737,"Sequence number": 5285406, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3272 + } + }, + { + "ph": "f", "id": 194, "pid": 4183441, "tid": 31362, "ts": 676008174512.352, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008174621.751, "dur": 140.226, + "args": { + "External id": 449738,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008174803.373, "dur": 37.560, + "args": { + "External id": 449739,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008174858.639, "dur": 44.527, + "args": { + "External id": 449740,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008174912.201, "dur": 28.158, + "args": { + "External id": 449741,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008174948.225, "dur": 34.054, + "args": { + "External id": 449742,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008174992.650, "dur": 23.096, + "args": { + "External id": 449743,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175022.248, "dur": 29.778, + "args": { + "External id": 449744,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008175073.715, "dur": 38.928, + "args": { + "External id": 449745,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008175133.650, "dur": 26.973, + "args": { + "External id": 449746,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008175178.236, "dur": 19.323, + "args": { + "External id": 449747,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008175208.299, "dur": 14.854, + "args": { + "External id": 449748,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175230.539, "dur": 40.391, + "args": { + "External id": 449749,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175274.406, "dur": 30.396, + "args": { + "External id": 449750,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008175334.191, "dur": 172.380, + "args": { + "External id": 449751,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008175417.386, "dur": 5.699, + "args": { + "External id": 449752,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008175425.027, "dur": 2.136, + "args": { + "External id": 449753,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008175537.992, "dur": 24.805, + "args": { + "External id": 449754,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008175573.343, "dur": 14.000, + "args": { + "External id": 449755,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175594.448, "dur": 41.809, + "args": { + "External id": 449756,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175641.843, "dur": 70.898, + "args": { + "External id": 449757,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175725.087, "dur": 31.279, + "args": { + "External id": 449758,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175763.699, "dur": 28.209, + "args": { + "External id": 449759,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175797.900, "dur": 30.255, + "args": { + "External id": 449760,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008175834.689, "dur": 29.436, + "args": { + "External id": 449761,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008175884.265, "dur": 24.001, + "args": { + "External id": 449762,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008175924.199, "dur": 37.852, + "args": { + "External id": 449763,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008175981.249, "dur": 23.615, + "args": { + "External id": 449764,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008176019.582, "dur": 15.394, + "args": { + "External id": 449765,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008176045.651, "dur": 18.924, + "args": { + "External id": 449766,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176155.543, "dur": 17.358, + "args": { + "External id": 449767,"Record function id": 0, "Ev Idx": 3302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176158.719, "dur": 13.264, + "args": { + "External id": 449768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176162.695, "dur": 8.394, + "args": { + "External id": 449769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176163.864, "dur": 7.130, + "args": { + "External id": 449770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176176.665, "dur": 4.272, + "args": { + "External id": 449771,"Record function id": 0, "Ev Idx": 3306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176177.943, "dur": 2.557, + "args": { + "External id": 449772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176178.608, "dur": 1.350, + "args": { + "External id": 449773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176179.192, "dur": 0.700, + "args": { + "External id": 449774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176184.303, "dur": 5.964, + "args": { + "External id": 449775,"Record function id": 0, "Ev Idx": 3310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176185.447, "dur": 4.427, + "args": { + "External id": 449776,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176186.158, "dur": 3.318, + "args": { + "External id": 449777,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176186.664, "dur": 2.742, + "args": { + "External id": 449778,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176193.406, "dur": 4.088, + "args": { + "External id": 449779,"Record function id": 0, "Ev Idx": 3314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176194.581, "dur": 2.526, + "args": { + "External id": 449780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176195.248, "dur": 1.420, + "args": { + "External id": 449781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176195.679, "dur": 0.895, + "args": { + "External id": 449782,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176200.468, "dur": 4.191, + "args": { + "External id": 449783,"Record function id": 0, "Ev Idx": 3318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176201.510, "dur": 2.764, + "args": { + "External id": 449784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176202.530, "dur": 1.344, + "args": { + "External id": 449785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176203.077, "dur": 0.621, + "args": { + "External id": 449786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176207.906, "dur": 4.099, + "args": { + "External id": 449787,"Record function id": 0, "Ev Idx": 3322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176209.123, "dur": 2.501, + "args": { + "External id": 449788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176209.786, "dur": 1.308, + "args": { + "External id": 449789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176210.377, "dur": 0.624, + "args": { + "External id": 449790,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176215.353, "dur": 3.237, + "args": { + "External id": 449791,"Record function id": 0, "Ev Idx": 3326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176216.320, "dur": 1.863, + "args": { + "External id": 449792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176216.810, "dur": 0.969, + "args": { + "External id": 449793,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176217.148, "dur": 0.565, + "args": { + "External id": 449794,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176221.625, "dur": 3.657, + "args": { + "External id": 449795,"Record function id": 0, "Ev Idx": 3330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176222.698, "dur": 2.139, + "args": { + "External id": 449796,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176223.234, "dur": 1.153, + "args": { + "External id": 449797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176223.546, "dur": 0.747, + "args": { + "External id": 449798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176231.328, "dur": 3.611, + "args": { + "External id": 449799,"Record function id": 0, "Ev Idx": 3334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008176232.323, "dur": 2.229, + "args": { + "External id": 449800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008176232.801, "dur": 1.216, + "args": { + "External id": 449801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008176233.306, "dur": 0.619, + "args": { + "External id": 449802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008176239.041, "dur": 16459.619, + "args": { + "External id": 449803,"Record function id": 0, "Sequence number": 5285405, "Fwd thread id": 1, "Ev Idx": 3338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008176240.745, "dur": 16447.984, + "args": { + "External id": 449804,"Sequence number": 5285405, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3339 + } + }, + { + "ph": "f", "id": 195, "pid": 4183441, "tid": 31362, "ts": 676008176240.745, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008176270.030, "dur": 41.368, + "args": { + "External id": 449805,"Record function id": 0, "Ev Idx": 3340 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008176319.272, "dur": 70.854, + "args": { + "External id": 449806,"Record function id": 0, "Ev Idx": 3341 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.8)", "pid": 4183441, "tid": 31362, + "ts": 676008176395.913, "dur": 16252.036, + "args": { + "External id": 449807,"Record function id": 0, "Ev Idx": 3342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008176483.441, "dur": 6.140, + "args": { + "External id": 449808,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008176498.774, "dur": 6.145, + "args": { + "External id": 449809,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008176521.187, "dur": 15420.630, + "args": { + "External id": 449810,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008176534.195, "dur": 15400.242, + "args": { + "External id": 449811,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008176555.912, "dur": 16.628, + "args": { + "External id": 449812,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008176577.554, "dur": 15322.415, + "args": { + "External id": 449813,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008176579.948, "dur": 15319.408, + "args": { + "External id": 449814,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008176583.603, "dur": 4.081, + "args": { + "External id": 449815,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008176589.347, "dur": 15306.262, + "args": { + "External id": 449816,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008192027.465, "dur": 9.079, + "args": { + "External id": 449817,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008192030.372, "dur": 5.733, + "args": { + "External id": 449818,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008192063.257, "dur": 319.450, + "args": { + "External id": 449819,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008192097.463, "dur": 280.666, + "args": { + "External id": 449820,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3355, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008192109.638, "dur": 263.473, + "args": { + "External id": 449821,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008192399.623, "dur": 2.096, + "args": { + "External id": 449822,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3357, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192457.224, "dur": 5.844, + "args": { + "External id": 449823,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192504.639, "dur": 1.216, + "args": { + "External id": 449824,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192521.228, "dur": 3.469, + "args": { + "External id": 449825,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192535.927, "dur": 0.814, + "args": { + "External id": 449826,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192547.165, "dur": 0.775, + "args": { + "External id": 449827,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192557.081, "dur": 0.807, + "args": { + "External id": 449828,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192567.698, "dur": 2.800, + "args": { + "External id": 449829,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192580.343, "dur": 1.820, + "args": { + "External id": 449830,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192591.663, "dur": 0.991, + "args": { + "External id": 449831,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008192714.796, "dur": 2601.371, + "args": { + "External id": 449832,"Record function id": 0, "Ev Idx": 3367 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008192736.773, "dur": 976.769, + "args": { + "External id": 449833,"Record function id": 0, "Ev Idx": 3368 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008192749.832, "dur": 297.188, + "args": { + "External id": 449834,"Record function id": 0, "Ev Idx": 3369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192836.687, "dur": 4.425, + "args": { + "External id": 449835,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192844.119, "dur": 1.250, + "args": { + "External id": 449836,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192847.372, "dur": 3.122, + "args": { + "External id": 449837,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192852.121, "dur": 0.897, + "args": { + "External id": 449838,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192854.537, "dur": 1.087, + "args": { + "External id": 449839,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192856.950, "dur": 0.984, + "args": { + "External id": 449840,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192859.418, "dur": 1.565, + "args": { + "External id": 449841,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192862.445, "dur": 0.896, + "args": { + "External id": 449842,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192864.518, "dur": 0.706, + "args": { + "External id": 449843,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008192866.624, "dur": 0.761, + "args": { + "External id": 449844,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008192883.960, "dur": 134.915, + "args": { + "External id": 449845,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008192898.801, "dur": 116.082, + "args": { + "External id": 449846,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008192911.089, "dur": 14.851, + "args": { + "External id": 449847,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008192928.672, "dur": 59.828, + "args": { + "External id": 449848,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008192931.187, "dur": 57.040, + "args": { + "External id": 449849,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008192935.204, "dur": 5.027, + "args": { + "External id": 449850,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008192941.969, "dur": 45.537, + "args": { + "External id": 449851,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3386 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.6", "pid": 4183441, "tid": 31362, + "ts": 676008193152.773, "dur": 553.702, + "args": { + "External id": 449852,"Record function id": 0, "Ev Idx": 3387 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008193167.943, "dur": 523.010, + "args": { + "External id": 449853,"Record function id": 0, "Ev Idx": 3388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008193229.727, "dur": 5.042, + "args": { + "External id": 449854,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008193249.838, "dur": 27.968, + "args": { + "External id": 449855,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193254.037, "dur": 1.534, + "args": { + "External id": 449856,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193257.703, "dur": 0.417, + "args": { + "External id": 449857,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193260.041, "dur": 0.813, + "args": { + "External id": 449858,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193262.078, "dur": 0.626, + "args": { + "External id": 449859,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193264.536, "dur": 0.318, + "args": { + "External id": 449860,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193266.084, "dur": 2.278, + "args": { + "External id": 449861,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193269.654, "dur": 0.377, + "args": { + "External id": 449862,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193271.354, "dur": 0.753, + "args": { + "External id": 449863,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193273.735, "dur": 0.412, + "args": { + "External id": 449864,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008193287.972, "dur": 33.038, + "args": { + "External id": 449865,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008193352.249, "dur": 90.807, + "args": { + "External id": 449866,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008193361.561, "dur": 2.966, + "args": { + "External id": 449867,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008193369.765, "dur": 8.791, + "args": { + "External id": 449868,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008193373.479, "dur": 4.641, + "args": { + "External id": 449869,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193376.316, "dur": 0.655, + "args": { + "External id": 449870,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008193385.074, "dur": 19.639, + "args": { + "External id": 449871,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193386.537, "dur": 0.365, + "args": { + "External id": 449872,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193388.173, "dur": 0.473, + "args": { + "External id": 449873,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193389.648, "dur": 2.551, + "args": { + "External id": 449874,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193393.750, "dur": 0.436, + "args": { + "External id": 449875,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193395.114, "dur": 0.470, + "args": { + "External id": 449876,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193397.104, "dur": 0.417, + "args": { + "External id": 449877,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193398.383, "dur": 0.410, + "args": { + "External id": 449878,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193399.963, "dur": 0.337, + "args": { + "External id": 449879,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008193401.200, "dur": 0.445, + "args": { + "External id": 449880,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008193414.665, "dur": 21.765, + "args": { + "External id": 449881,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008193489.362, "dur": 104.164, + "args": { + "External id": 449882,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008193511.590, "dur": 78.706, + "args": { + "External id": 449883,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3418, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008193520.692, "dur": 65.813, + "args": { + "External id": 449884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008193606.395, "dur": 1.788, + "args": { + "External id": 449885,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3420, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008193721.888, "dur": 1573.797, + "args": { + "External id": 449886,"Sequence number": 5285404, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3421 + } + }, + { + "ph": "f", "id": 196, "pid": 4183441, "tid": 31362, "ts": 676008193721.888, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008193831.132, "dur": 100.224, + "args": { + "External id": 449887,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008193976.011, "dur": 42.175, + "args": { + "External id": 449888,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008194034.364, "dur": 40.912, + "args": { + "External id": 449889,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194102.134, "dur": 33.265, + "args": { + "External id": 449890,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194144.811, "dur": 34.309, + "args": { + "External id": 449891,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194185.924, "dur": 22.316, + "args": { + "External id": 449892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194215.857, "dur": 29.463, + "args": { + "External id": 449893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008194269.169, "dur": 24.466, + "args": { + "External id": 449894,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008194310.094, "dur": 26.540, + "args": { + "External id": 449895,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008194359.178, "dur": 18.112, + "args": { + "External id": 449896,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008194389.062, "dur": 17.003, + "args": { + "External id": 449897,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194413.365, "dur": 35.469, + "args": { + "External id": 449898,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194452.187, "dur": 30.593, + "args": { + "External id": 449899,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008194509.435, "dur": 204.004, + "args": { + "External id": 449900,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008194584.290, "dur": 7.333, + "args": { + "External id": 449901,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008194593.459, "dur": 2.580, + "args": { + "External id": 449902,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008194748.947, "dur": 28.282, + "args": { + "External id": 449903,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008194788.346, "dur": 15.685, + "args": { + "External id": 449904,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194812.489, "dur": 50.770, + "args": { + "External id": 449905,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194868.542, "dur": 31.349, + "args": { + "External id": 449906,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194906.554, "dur": 27.329, + "args": { + "External id": 449907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194940.282, "dur": 28.289, + "args": { + "External id": 449908,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008194974.411, "dur": 26.780, + "args": { + "External id": 449909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008195007.648, "dur": 28.378, + "args": { + "External id": 449910,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008195052.065, "dur": 48.461, + "args": { + "External id": 449911,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008195132.746, "dur": 33.747, + "args": { + "External id": 449912,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008195182.995, "dur": 18.072, + "args": { + "External id": 449913,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008195216.762, "dur": 14.563, + "args": { + "External id": 449914,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008195250.398, "dur": 15.882, + "args": { + "External id": 449915,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195336.929, "dur": 17.602, + "args": { + "External id": 449916,"Record function id": 0, "Ev Idx": 3451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195339.942, "dur": 13.772, + "args": { + "External id": 449917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195344.174, "dur": 8.561, + "args": { + "External id": 449918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195345.691, "dur": 6.950, + "args": { + "External id": 449919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195358.375, "dur": 4.860, + "args": { + "External id": 449920,"Record function id": 0, "Ev Idx": 3455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195359.954, "dur": 2.861, + "args": { + "External id": 449921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195360.574, "dur": 1.696, + "args": { + "External id": 449922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195361.421, "dur": 0.770, + "args": { + "External id": 449923,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195366.498, "dur": 4.123, + "args": { + "External id": 449924,"Record function id": 0, "Ev Idx": 3459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195367.753, "dur": 2.474, + "args": { + "External id": 449925,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195368.587, "dur": 1.178, + "args": { + "External id": 449926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195369.064, "dur": 0.617, + "args": { + "External id": 449927,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195373.751, "dur": 4.093, + "args": { + "External id": 449928,"Record function id": 0, "Ev Idx": 3463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195375.099, "dur": 2.350, + "args": { + "External id": 449929,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195375.971, "dur": 1.071, + "args": { + "External id": 449930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195376.362, "dur": 0.597, + "args": { + "External id": 449931,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195380.897, "dur": 5.426, + "args": { + "External id": 449932,"Record function id": 0, "Ev Idx": 3467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195382.049, "dur": 3.868, + "args": { + "External id": 449933,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195382.777, "dur": 2.715, + "args": { + "External id": 449934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195383.140, "dur": 2.294, + "args": { + "External id": 449935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195389.433, "dur": 3.986, + "args": { + "External id": 449936,"Record function id": 0, "Ev Idx": 3471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195390.545, "dur": 2.481, + "args": { + "External id": 449937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195391.065, "dur": 1.397, + "args": { + "External id": 449938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195391.371, "dur": 1.022, + "args": { + "External id": 449939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195396.530, "dur": 3.737, + "args": { + "External id": 449940,"Record function id": 0, "Ev Idx": 3475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195397.473, "dur": 2.402, + "args": { + "External id": 449941,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195397.953, "dur": 1.384, + "args": { + "External id": 449942,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195398.666, "dur": 0.605, + "args": { + "External id": 449943,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195403.432, "dur": 7.881, + "args": { + "External id": 449944,"Record function id": 0, "Ev Idx": 3479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195404.551, "dur": 6.365, + "args": { + "External id": 449945,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195405.260, "dur": 5.093, + "args": { + "External id": 449946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195405.857, "dur": 4.429, + "args": { + "External id": 449947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195414.319, "dur": 3.654, + "args": { + "External id": 449948,"Record function id": 0, "Ev Idx": 3483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008195415.392, "dur": 2.180, + "args": { + "External id": 449949,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008195415.931, "dur": 1.106, + "args": { + "External id": 449950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008195416.430, "dur": 0.542, + "args": { + "External id": 449951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008195421.598, "dur": 14934.709, + "args": { + "External id": 449952,"Record function id": 0, "Sequence number": 5285403, "Fwd thread id": 1, "Ev Idx": 3487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008195422.904, "dur": 14925.074, + "args": { + "External id": 449953,"Sequence number": 5285403, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3488 + } + }, + { + "ph": "f", "id": 197, "pid": 4183441, "tid": 31362, "ts": 676008195422.904, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008195449.586, "dur": 38.994, + "args": { + "External id": 449954,"Record function id": 0, "Ev Idx": 3489 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008195495.768, "dur": 67.986, + "args": { + "External id": 449955,"Record function id": 0, "Ev Idx": 3490 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.7)", "pid": 4183441, "tid": 31362, + "ts": 676008195569.320, "dur": 14771.647, + "args": { + "External id": 449956,"Record function id": 0, "Ev Idx": 3491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008195708.721, "dur": 8.159, + "args": { + "External id": 449957,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008195728.419, "dur": 5.407, + "args": { + "External id": 449958,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008195748.464, "dur": 13944.485, + "args": { + "External id": 449959,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008195765.346, "dur": 13919.403, + "args": { + "External id": 449960,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008195791.045, "dur": 14.076, + "args": { + "External id": 449961,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008195809.592, "dur": 13813.025, + "args": { + "External id": 449962,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008195812.087, "dur": 13809.715, + "args": { + "External id": 449963,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008195819.401, "dur": 6.089, + "args": { + "External id": 449964,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008195827.427, "dur": 13791.517, + "args": { + "External id": 449965,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008209778.334, "dur": 8.929, + "args": { + "External id": 449966,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008209781.152, "dur": 5.683, + "args": { + "External id": 449967,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008209814.043, "dur": 248.410, + "args": { + "External id": 449968,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008209839.764, "dur": 218.504, + "args": { + "External id": 449969,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3504, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008209850.456, "dur": 202.957, + "args": { + "External id": 449970,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008210077.977, "dur": 2.168, + "args": { + "External id": 449971,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3506, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210148.384, "dur": 6.004, + "args": { + "External id": 449972,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210195.254, "dur": 1.428, + "args": { + "External id": 449973,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210211.677, "dur": 1.377, + "args": { + "External id": 449974,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210223.982, "dur": 2.580, + "args": { + "External id": 449975,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210237.806, "dur": 0.662, + "args": { + "External id": 449976,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210248.188, "dur": 1.340, + "args": { + "External id": 449977,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210259.871, "dur": 0.894, + "args": { + "External id": 449978,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210271.560, "dur": 3.273, + "args": { + "External id": 449979,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210283.726, "dur": 0.597, + "args": { + "External id": 449980,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008210371.647, "dur": 2615.272, + "args": { + "External id": 449981,"Record function id": 0, "Ev Idx": 3516 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008210389.887, "dur": 965.725, + "args": { + "External id": 449982,"Record function id": 0, "Ev Idx": 3517 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008210402.609, "dur": 320.367, + "args": { + "External id": 449983,"Record function id": 0, "Ev Idx": 3518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210479.239, "dur": 4.101, + "args": { + "External id": 449984,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210486.162, "dur": 0.915, + "args": { + "External id": 449985,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210488.966, "dur": 0.990, + "args": { + "External id": 449986,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210491.446, "dur": 0.757, + "args": { + "External id": 449987,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210494.138, "dur": 2.020, + "args": { + "External id": 449988,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210497.572, "dur": 0.727, + "args": { + "External id": 449989,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210500.311, "dur": 1.334, + "args": { + "External id": 449990,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210503.159, "dur": 1.031, + "args": { + "External id": 449991,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210505.667, "dur": 0.757, + "args": { + "External id": 449992,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008210508.146, "dur": 0.718, + "args": { + "External id": 449993,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008210525.805, "dur": 167.422, + "args": { + "External id": 449994,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008210541.322, "dur": 146.745, + "args": { + "External id": 449995,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008210552.560, "dur": 12.254, + "args": { + "External id": 449996,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008210567.241, "dur": 58.236, + "args": { + "External id": 449997,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008210569.642, "dur": 55.462, + "args": { + "External id": 449998,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210573.122, "dur": 5.304, + "args": { + "External id": 449999,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008210580.408, "dur": 43.930, + "args": { + "External id": 450000,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3535 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.5", "pid": 4183441, "tid": 31362, + "ts": 676008210809.119, "dur": 539.059, + "args": { + "External id": 450001,"Record function id": 0, "Ev Idx": 3536 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008210826.544, "dur": 509.473, + "args": { + "External id": 450002,"Record function id": 0, "Ev Idx": 3537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008210890.715, "dur": 6.473, + "args": { + "External id": 450003,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008210911.737, "dur": 27.022, + "args": { + "External id": 450004,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210916.043, "dur": 1.603, + "args": { + "External id": 450005,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210919.125, "dur": 0.762, + "args": { + "External id": 450006,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210921.510, "dur": 0.414, + "args": { + "External id": 450007,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210922.979, "dur": 0.530, + "args": { + "External id": 450008,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210924.754, "dur": 0.257, + "args": { + "External id": 450009,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210926.189, "dur": 0.449, + "args": { + "External id": 450010,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210927.858, "dur": 0.323, + "args": { + "External id": 450011,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210929.085, "dur": 1.615, + "args": { + "External id": 450012,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008210931.763, "dur": 0.260, + "args": { + "External id": 450013,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008210948.986, "dur": 32.246, + "args": { + "External id": 450014,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008211013.979, "dur": 111.942, + "args": { + "External id": 450015,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008211023.883, "dur": 3.227, + "args": { + "External id": 450016,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008211032.673, "dur": 9.496, + "args": { + "External id": 450017,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008211036.680, "dur": 5.073, + "args": { + "External id": 450018,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211039.730, "dur": 0.683, + "args": { + "External id": 450019,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008211050.114, "dur": 21.444, + "args": { + "External id": 450020,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211051.775, "dur": 0.514, + "args": { + "External id": 450021,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211053.603, "dur": 0.609, + "args": { + "External id": 450022,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211055.783, "dur": 0.530, + "args": { + "External id": 450023,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211057.598, "dur": 0.348, + "args": { + "External id": 450024,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211059.636, "dur": 2.496, + "args": { + "External id": 450025,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211062.988, "dur": 0.354, + "args": { + "External id": 450026,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211064.897, "dur": 0.267, + "args": { + "External id": 450027,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211066.476, "dur": 0.385, + "args": { + "External id": 450028,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008211068.733, "dur": 0.392, + "args": { + "External id": 450029,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008211095.147, "dur": 22.262, + "args": { + "External id": 450030,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008211170.253, "dur": 102.692, + "args": { + "External id": 450031,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008211192.542, "dur": 77.159, + "args": { + "External id": 450032,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3567, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008211202.456, "dur": 63.467, + "args": { + "External id": 450033,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008211285.958, "dur": 1.518, + "args": { + "External id": 450034,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3569, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008211362.174, "dur": 1601.860, + "args": { + "External id": 450035,"Sequence number": 5285402, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3570 + } + }, + { + "ph": "f", "id": 198, "pid": 4183441, "tid": 31362, "ts": 676008211362.174, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008211473.974, "dur": 95.564, + "args": { + "External id": 450036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008211608.759, "dur": 37.212, + "args": { + "External id": 450037,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008211704.784, "dur": 51.288, + "args": { + "External id": 450038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008211766.116, "dur": 29.831, + "args": { + "External id": 450039,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008211802.310, "dur": 33.647, + "args": { + "External id": 450040,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008211843.496, "dur": 21.706, + "args": { + "External id": 450041,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008211875.366, "dur": 29.179, + "args": { + "External id": 450042,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008211927.850, "dur": 27.405, + "args": { + "External id": 450043,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008211973.221, "dur": 27.244, + "args": { + "External id": 450044,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008212017.546, "dur": 19.650, + "args": { + "External id": 450045,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008212048.502, "dur": 14.403, + "args": { + "External id": 450046,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212071.797, "dur": 55.611, + "args": { + "External id": 450047,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212132.326, "dur": 32.350, + "args": { + "External id": 450048,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008212209.638, "dur": 163.085, + "args": { + "External id": 450049,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008212282.409, "dur": 6.349, + "args": { + "External id": 450050,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008212290.535, "dur": 2.462, + "args": { + "External id": 450051,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008212403.789, "dur": 24.771, + "args": { + "External id": 450052,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008212439.272, "dur": 14.817, + "args": { + "External id": 450053,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212462.652, "dur": 43.071, + "args": { + "External id": 450054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212513.221, "dur": 33.495, + "args": { + "External id": 450055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212552.207, "dur": 27.693, + "args": { + "External id": 450056,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212584.796, "dur": 29.973, + "args": { + "External id": 450057,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212620.149, "dur": 27.146, + "args": { + "External id": 450058,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008212693.339, "dur": 34.584, + "args": { + "External id": 450059,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008212746.909, "dur": 23.056, + "args": { + "External id": 450060,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008212791.694, "dur": 36.676, + "args": { + "External id": 450061,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008212850.421, "dur": 24.122, + "args": { + "External id": 450062,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008212890.851, "dur": 14.789, + "args": { + "External id": 450063,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008212917.416, "dur": 19.996, + "args": { + "External id": 450064,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213009.014, "dur": 13.793, + "args": { + "External id": 450065,"Record function id": 0, "Ev Idx": 3600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213011.899, "dur": 10.131, + "args": { + "External id": 450066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213015.760, "dur": 5.472, + "args": { + "External id": 450067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213017.009, "dur": 4.126, + "args": { + "External id": 450068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213026.526, "dur": 4.400, + "args": { + "External id": 450069,"Record function id": 0, "Ev Idx": 3604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213028.059, "dur": 2.447, + "args": { + "External id": 450070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213028.733, "dur": 1.284, + "args": { + "External id": 450071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213029.106, "dur": 0.827, + "args": { + "External id": 450072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213034.129, "dur": 9.266, + "args": { + "External id": 450073,"Record function id": 0, "Ev Idx": 3608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213035.421, "dur": 7.535, + "args": { + "External id": 450074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213036.007, "dur": 6.420, + "args": { + "External id": 450075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213036.353, "dur": 5.972, + "args": { + "External id": 450076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213046.660, "dur": 4.261, + "args": { + "External id": 450077,"Record function id": 0, "Ev Idx": 3612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213047.992, "dur": 2.525, + "args": { + "External id": 450078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213048.665, "dur": 1.225, + "args": { + "External id": 450079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213049.105, "dur": 0.720, + "args": { + "External id": 450080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213054.034, "dur": 3.454, + "args": { + "External id": 450081,"Record function id": 0, "Ev Idx": 3616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213055.226, "dur": 1.856, + "args": { + "External id": 450082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213055.694, "dur": 0.983, + "args": { + "External id": 450083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213056.072, "dur": 0.533, + "args": { + "External id": 450084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213060.567, "dur": 3.747, + "args": { + "External id": 450085,"Record function id": 0, "Ev Idx": 3620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213061.815, "dur": 2.106, + "args": { + "External id": 450086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213062.385, "dur": 1.123, + "args": { + "External id": 450087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213062.831, "dur": 0.612, + "args": { + "External id": 450088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213067.558, "dur": 3.827, + "args": { + "External id": 450089,"Record function id": 0, "Ev Idx": 3624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213068.963, "dur": 2.029, + "args": { + "External id": 450090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213069.489, "dur": 1.068, + "args": { + "External id": 450091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213069.923, "dur": 0.569, + "args": { + "External id": 450092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213074.418, "dur": 3.816, + "args": { + "External id": 450093,"Record function id": 0, "Ev Idx": 3628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213075.712, "dur": 2.125, + "args": { + "External id": 450094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213076.198, "dur": 1.253, + "args": { + "External id": 450095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213076.677, "dur": 0.704, + "args": { + "External id": 450096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213099.016, "dur": 7.774, + "args": { + "External id": 450097,"Record function id": 0, "Ev Idx": 3632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008213102.087, "dur": 4.045, + "args": { + "External id": 450098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008213103.106, "dur": 2.203, + "args": { + "External id": 450099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008213103.767, "dur": 1.318, + "args": { + "External id": 450100,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008213112.016, "dur": 14886.749, + "args": { + "External id": 450101,"Record function id": 0, "Sequence number": 5285401, "Fwd thread id": 1, "Ev Idx": 3636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008213113.345, "dur": 14876.543, + "args": { + "External id": 450102,"Sequence number": 5285401, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3637 + } + }, + { + "ph": "f", "id": 199, "pid": 4183441, "tid": 31362, "ts": 676008213113.345, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008213143.086, "dur": 40.705, + "args": { + "External id": 450103,"Record function id": 0, "Ev Idx": 3638 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008213191.211, "dur": 71.095, + "args": { + "External id": 450104,"Record function id": 0, "Ev Idx": 3639 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.6)", "pid": 4183441, "tid": 31362, + "ts": 676008213268.311, "dur": 14714.822, + "args": { + "External id": 450105,"Record function id": 0, "Ev Idx": 3640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008213360.663, "dur": 6.660, + "args": { + "External id": 450106,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008213376.759, "dur": 6.333, + "args": { + "External id": 450107,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008213399.436, "dur": 13924.897, + "args": { + "External id": 450108,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008213413.524, "dur": 13903.158, + "args": { + "External id": 450109,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008213435.905, "dur": 16.604, + "args": { + "External id": 450110,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008213457.011, "dur": 13825.261, + "args": { + "External id": 450111,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008213459.427, "dur": 13822.121, + "args": { + "External id": 450112,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008213463.569, "dur": 4.864, + "args": { + "External id": 450113,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008213470.220, "dur": 13807.697, + "args": { + "External id": 450114,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008227407.726, "dur": 8.362, + "args": { + "External id": 450115,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008227410.557, "dur": 5.121, + "args": { + "External id": 450116,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008227442.166, "dur": 276.714, + "args": { + "External id": 450117,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008227466.537, "dur": 247.770, + "args": { + "External id": 450118,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3653, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008227477.480, "dur": 231.402, + "args": { + "External id": 450119,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008227736.100, "dur": 2.297, + "args": { + "External id": 450120,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3655, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227790.512, "dur": 6.372, + "args": { + "External id": 450121,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227837.913, "dur": 1.110, + "args": { + "External id": 450122,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227854.346, "dur": 1.218, + "args": { + "External id": 450123,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227866.401, "dur": 2.731, + "args": { + "External id": 450124,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227880.140, "dur": 0.781, + "args": { + "External id": 450125,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227890.476, "dur": 0.823, + "args": { + "External id": 450126,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227901.218, "dur": 0.908, + "args": { + "External id": 450127,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227913.651, "dur": 3.293, + "args": { + "External id": 450128,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008227926.964, "dur": 0.702, + "args": { + "External id": 450129,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008228012.769, "dur": 2581.430, + "args": { + "External id": 450130,"Record function id": 0, "Ev Idx": 3665 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008228032.162, "dur": 968.451, + "args": { + "External id": 450131,"Record function id": 0, "Ev Idx": 3666 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008228046.349, "dur": 305.584, + "args": { + "External id": 450132,"Record function id": 0, "Ev Idx": 3667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228143.595, "dur": 4.721, + "args": { + "External id": 450133,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228151.822, "dur": 1.197, + "args": { + "External id": 450134,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228154.914, "dur": 0.772, + "args": { + "External id": 450135,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228157.594, "dur": 0.867, + "args": { + "External id": 450136,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228160.213, "dur": 2.488, + "args": { + "External id": 450137,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228164.397, "dur": 0.853, + "args": { + "External id": 450138,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228166.845, "dur": 1.260, + "args": { + "External id": 450139,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228169.731, "dur": 0.910, + "args": { + "External id": 450140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228172.111, "dur": 0.664, + "args": { + "External id": 450141,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008228174.266, "dur": 0.817, + "args": { + "External id": 450142,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008228192.689, "dur": 132.873, + "args": { + "External id": 450143,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008228208.361, "dur": 113.163, + "args": { + "External id": 450144,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008228220.474, "dur": 11.416, + "args": { + "External id": 450145,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008228234.854, "dur": 58.833, + "args": { + "External id": 450146,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008228237.209, "dur": 56.137, + "args": { + "External id": 450147,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228240.833, "dur": 5.933, + "args": { + "External id": 450148,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008228248.393, "dur": 44.418, + "args": { + "External id": 450149,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3684 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.4", "pid": 4183441, "tid": 31362, + "ts": 676008228438.896, "dur": 553.786, + "args": { + "External id": 450150,"Record function id": 0, "Ev Idx": 3685 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008228454.847, "dur": 525.638, + "args": { + "External id": 450151,"Record function id": 0, "Ev Idx": 3686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008228513.520, "dur": 8.843, + "args": { + "External id": 450152,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008228536.294, "dur": 24.820, + "args": { + "External id": 450153,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228540.180, "dur": 1.444, + "args": { + "External id": 450154,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228543.401, "dur": 0.386, + "args": { + "External id": 450155,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228545.259, "dur": 0.243, + "args": { + "External id": 450156,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228546.907, "dur": 0.708, + "args": { + "External id": 450157,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228549.287, "dur": 0.419, + "args": { + "External id": 450158,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228550.941, "dur": 0.576, + "args": { + "External id": 450159,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228552.821, "dur": 0.460, + "args": { + "External id": 450160,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228554.561, "dur": 2.401, + "args": { + "External id": 450161,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228558.030, "dur": 0.439, + "args": { + "External id": 450162,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008228570.600, "dur": 32.233, + "args": { + "External id": 450163,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008228631.589, "dur": 136.100, + "args": { + "External id": 450164,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008228640.317, "dur": 3.113, + "args": { + "External id": 450165,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008228648.099, "dur": 46.447, + "args": { + "External id": 450166,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008228687.700, "dur": 6.419, + "args": { + "External id": 450167,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228691.408, "dur": 0.930, + "args": { + "External id": 450168,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008228703.015, "dur": 21.078, + "args": { + "External id": 450169,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228704.569, "dur": 0.518, + "args": { + "External id": 450170,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228706.359, "dur": 0.343, + "args": { + "External id": 450171,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228707.852, "dur": 0.372, + "args": { + "External id": 450172,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228709.653, "dur": 0.637, + "args": { + "External id": 450173,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228711.146, "dur": 1.904, + "args": { + "External id": 450174,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228713.982, "dur": 0.444, + "args": { + "External id": 450175,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228715.205, "dur": 0.760, + "args": { + "External id": 450176,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228716.995, "dur": 0.391, + "args": { + "External id": 450177,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008228718.268, "dur": 0.405, + "args": { + "External id": 450178,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008228735.662, "dur": 24.001, + "args": { + "External id": 450179,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008228813.387, "dur": 104.415, + "args": { + "External id": 450180,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008228835.140, "dur": 79.494, + "args": { + "External id": 450181,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3716, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008228844.485, "dur": 65.394, + "args": { + "External id": 450182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008228930.379, "dur": 1.832, + "args": { + "External id": 450183,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3718, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008229008.262, "dur": 1560.891, + "args": { + "External id": 450184,"Sequence number": 5285400, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3719 + } + }, + { + "ph": "f", "id": 200, "pid": 4183441, "tid": 31362, "ts": 676008229008.262, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229138.454, "dur": 99.873, + "args": { + "External id": 450185,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008229278.608, "dur": 38.633, + "args": { + "External id": 450186,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008229333.965, "dur": 39.500, + "args": { + "External id": 450187,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229382.829, "dur": 26.256, + "args": { + "External id": 450188,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229414.535, "dur": 32.374, + "args": { + "External id": 450189,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229454.078, "dur": 19.799, + "args": { + "External id": 450190,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229481.297, "dur": 28.578, + "args": { + "External id": 450191,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008229534.385, "dur": 20.798, + "args": { + "External id": 450192,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008229573.925, "dur": 29.616, + "args": { + "External id": 450193,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008229622.507, "dur": 21.215, + "args": { + "External id": 450194,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008229693.855, "dur": 20.221, + "args": { + "External id": 450195,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229725.931, "dur": 43.025, + "args": { + "External id": 450196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008229772.682, "dur": 31.204, + "args": { + "External id": 450197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008229830.375, "dur": 161.557, + "args": { + "External id": 450198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008229903.424, "dur": 5.628, + "args": { + "External id": 450199,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008229910.739, "dur": 2.704, + "args": { + "External id": 450200,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008230025.121, "dur": 25.548, + "args": { + "External id": 450201,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008230063.637, "dur": 14.410, + "args": { + "External id": 450202,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230102.156, "dur": 54.028, + "args": { + "External id": 450203,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230164.101, "dur": 33.983, + "args": { + "External id": 450204,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230204.789, "dur": 28.105, + "args": { + "External id": 450205,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230237.008, "dur": 28.442, + "args": { + "External id": 450206,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230270.348, "dur": 26.852, + "args": { + "External id": 450207,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008230305.811, "dur": 29.309, + "args": { + "External id": 450208,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008230352.391, "dur": 22.336, + "args": { + "External id": 450209,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008230395.209, "dur": 25.085, + "args": { + "External id": 450210,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008230434.908, "dur": 20.014, + "args": { + "External id": 450211,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008230483.419, "dur": 23.151, + "args": { + "External id": 450212,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008230521.464, "dur": 19.444, + "args": { + "External id": 450213,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230614.816, "dur": 14.135, + "args": { + "External id": 450214,"Record function id": 0, "Ev Idx": 3749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230618.189, "dur": 9.950, + "args": { + "External id": 450215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230622.205, "dur": 5.131, + "args": { + "External id": 450216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230623.506, "dur": 3.738, + "args": { + "External id": 450217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230632.662, "dur": 4.479, + "args": { + "External id": 450218,"Record function id": 0, "Ev Idx": 3753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230633.962, "dur": 2.765, + "args": { + "External id": 450219,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230634.811, "dur": 1.422, + "args": { + "External id": 450220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230635.186, "dur": 0.968, + "args": { + "External id": 450221,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230640.348, "dur": 4.370, + "args": { + "External id": 450222,"Record function id": 0, "Ev Idx": 3757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230641.731, "dur": 2.545, + "args": { + "External id": 450223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230642.263, "dur": 1.432, + "args": { + "External id": 450224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230642.856, "dur": 0.755, + "args": { + "External id": 450225,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230685.632, "dur": 8.921, + "args": { + "External id": 450226,"Record function id": 0, "Ev Idx": 3761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230688.129, "dur": 5.742, + "args": { + "External id": 450227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230689.402, "dur": 3.587, + "args": { + "External id": 450228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230689.988, "dur": 2.765, + "args": { + "External id": 450229,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230698.923, "dur": 4.821, + "args": { + "External id": 450230,"Record function id": 0, "Ev Idx": 3765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230700.460, "dur": 2.880, + "args": { + "External id": 450231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230701.126, "dur": 1.599, + "args": { + "External id": 450232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230701.664, "dur": 0.957, + "args": { + "External id": 450233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230709.940, "dur": 4.352, + "args": { + "External id": 450234,"Record function id": 0, "Ev Idx": 3769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230711.369, "dur": 2.495, + "args": { + "External id": 450235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230711.931, "dur": 1.372, + "args": { + "External id": 450236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230712.604, "dur": 0.605, + "args": { + "External id": 450237,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230717.525, "dur": 3.871, + "args": { + "External id": 450238,"Record function id": 0, "Ev Idx": 3773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230718.869, "dur": 2.121, + "args": { + "External id": 450239,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230719.324, "dur": 1.246, + "args": { + "External id": 450240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230719.810, "dur": 0.666, + "args": { + "External id": 450241,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230724.449, "dur": 3.922, + "args": { + "External id": 450242,"Record function id": 0, "Ev Idx": 3777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230725.429, "dur": 2.530, + "args": { + "External id": 450243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230725.934, "dur": 1.496, + "args": { + "External id": 450244,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230726.463, "dur": 0.873, + "args": { + "External id": 450245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230731.789, "dur": 3.991, + "args": { + "External id": 450246,"Record function id": 0, "Ev Idx": 3781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008230732.860, "dur": 2.508, + "args": { + "External id": 450247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008230733.473, "dur": 1.486, + "args": { + "External id": 450248,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008230733.943, "dur": 0.926, + "args": { + "External id": 450249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008230739.853, "dur": 14851.727, + "args": { + "External id": 450250,"Record function id": 0, "Sequence number": 5285399, "Fwd thread id": 1, "Ev Idx": 3785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008230741.444, "dur": 14842.420, + "args": { + "External id": 450251,"Sequence number": 5285399, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3786 + } + }, + { + "ph": "f", "id": 201, "pid": 4183441, "tid": 31362, "ts": 676008230741.444, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008230769.978, "dur": 35.142, + "args": { + "External id": 450252,"Record function id": 0, "Ev Idx": 3787 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008230812.543, "dur": 70.458, + "args": { + "External id": 450253,"Record function id": 0, "Ev Idx": 3788 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.5)", "pid": 4183441, "tid": 31362, + "ts": 676008230888.306, "dur": 14688.104, + "args": { + "External id": 450254,"Record function id": 0, "Ev Idx": 3789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008230978.342, "dur": 6.611, + "args": { + "External id": 450255,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008230994.089, "dur": 4.639, + "args": { + "External id": 450256,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008231011.876, "dur": 13864.821, + "args": { + "External id": 450257,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008231024.753, "dur": 13844.361, + "args": { + "External id": 450258,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008231053.952, "dur": 15.196, + "args": { + "External id": 450259,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008231073.583, "dur": 13760.210, + "args": { + "External id": 450260,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008231076.047, "dur": 13757.139, + "args": { + "External id": 450261,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008231080.131, "dur": 21.841, + "args": { + "External id": 450262,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008231104.455, "dur": 13725.672, + "args": { + "External id": 450263,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008244963.219, "dur": 8.841, + "args": { + "External id": 450264,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008244966.055, "dur": 5.564, + "args": { + "External id": 450265,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008244998.937, "dur": 307.026, + "args": { + "External id": 450266,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008245023.232, "dur": 277.846, + "args": { + "External id": 450267,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3802, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008245034.404, "dur": 261.653, + "args": { + "External id": 450268,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008245323.238, "dur": 2.099, + "args": { + "External id": 450269,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3804, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245378.882, "dur": 6.146, + "args": { + "External id": 450270,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245425.836, "dur": 1.241, + "args": { + "External id": 450271,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245442.774, "dur": 1.288, + "args": { + "External id": 450272,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245456.786, "dur": 2.805, + "args": { + "External id": 450273,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245470.287, "dur": 0.717, + "args": { + "External id": 450274,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245480.814, "dur": 0.959, + "args": { + "External id": 450275,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245492.184, "dur": 0.849, + "args": { + "External id": 450276,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245503.633, "dur": 3.175, + "args": { + "External id": 450277,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245516.682, "dur": 0.718, + "args": { + "External id": 450278,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008245605.505, "dur": 2589.156, + "args": { + "External id": 450279,"Record function id": 0, "Ev Idx": 3814 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008245626.199, "dur": 961.564, + "args": { + "External id": 450280,"Record function id": 0, "Ev Idx": 3815 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008245640.055, "dur": 327.844, + "args": { + "External id": 450281,"Record function id": 0, "Ev Idx": 3816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245758.880, "dur": 4.856, + "args": { + "External id": 450282,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245766.802, "dur": 1.284, + "args": { + "External id": 450283,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245770.012, "dur": 0.772, + "args": { + "External id": 450284,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245772.479, "dur": 0.875, + "args": { + "External id": 450285,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245774.855, "dur": 2.597, + "args": { + "External id": 450286,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245779.140, "dur": 1.045, + "args": { + "External id": 450287,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245781.785, "dur": 1.114, + "args": { + "External id": 450288,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245784.485, "dur": 0.900, + "args": { + "External id": 450289,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245786.839, "dur": 1.132, + "args": { + "External id": 450290,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008245789.593, "dur": 1.254, + "args": { + "External id": 450291,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008245808.117, "dur": 131.853, + "args": { + "External id": 450292,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008245823.466, "dur": 112.799, + "args": { + "External id": 450293,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008245835.938, "dur": 12.627, + "args": { + "External id": 450294,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008245851.235, "dur": 59.704, + "args": { + "External id": 450295,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008245854.051, "dur": 56.580, + "args": { + "External id": 450296,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008245857.295, "dur": 5.211, + "args": { + "External id": 450297,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008245864.046, "dur": 45.925, + "args": { + "External id": 450298,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3833 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.3", "pid": 4183441, "tid": 31362, + "ts": 676008246052.823, "dur": 527.373, + "args": { + "External id": 450299,"Record function id": 0, "Ev Idx": 3834 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008246070.123, "dur": 498.103, + "args": { + "External id": 450300,"Record function id": 0, "Ev Idx": 3835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008246151.671, "dur": 6.997, + "args": { + "External id": 450301,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008246173.587, "dur": 27.554, + "args": { + "External id": 450302,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246177.686, "dur": 1.340, + "args": { + "External id": 450303,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246181.093, "dur": 0.366, + "args": { + "External id": 450304,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246182.850, "dur": 0.812, + "args": { + "External id": 450305,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246187.650, "dur": 0.418, + "args": { + "External id": 450306,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246189.009, "dur": 0.402, + "args": { + "External id": 450307,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246190.622, "dur": 0.204, + "args": { + "External id": 450308,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246191.735, "dur": 0.427, + "args": { + "External id": 450309,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246193.587, "dur": 1.503, + "args": { + "External id": 450310,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246195.953, "dur": 0.374, + "args": { + "External id": 450311,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008246211.608, "dur": 32.160, + "args": { + "External id": 450312,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008246274.478, "dur": 91.215, + "args": { + "External id": 450313,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008246283.697, "dur": 3.272, + "args": { + "External id": 450314,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008246292.154, "dur": 9.557, + "args": { + "External id": 450315,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008246296.045, "dur": 5.208, + "args": { + "External id": 450316,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 3851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246299.308, "dur": 0.488, + "args": { + "External id": 450317,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008246308.183, "dur": 20.462, + "args": { + "External id": 450318,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246309.788, "dur": 0.584, + "args": { + "External id": 450319,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246311.798, "dur": 0.319, + "args": { + "External id": 450320,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246312.925, "dur": 0.342, + "args": { + "External id": 450321,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246314.465, "dur": 0.345, + "args": { + "External id": 450322,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246315.591, "dur": 1.782, + "args": { + "External id": 450323,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246318.354, "dur": 0.295, + "args": { + "External id": 450324,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246319.478, "dur": 0.376, + "args": { + "External id": 450325,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246320.774, "dur": 0.266, + "args": { + "External id": 450326,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008246321.924, "dur": 0.421, + "args": { + "External id": 450327,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008246338.261, "dur": 19.609, + "args": { + "External id": 450328,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008246407.356, "dur": 100.975, + "args": { + "External id": 450329,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 3864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008246428.418, "dur": 76.756, + "args": { + "External id": 450330,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3865, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008246437.361, "dur": 63.936, + "args": { + "External id": 450331,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 3866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008246520.780, "dur": 1.682, + "args": { + "External id": 450332,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3867, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008246593.994, "dur": 1579.770, + "args": { + "External id": 450333,"Sequence number": 5285398, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3868 + } + }, + { + "ph": "f", "id": 202, "pid": 4183441, "tid": 31362, "ts": 676008246593.994, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008246742.330, "dur": 99.144, + "args": { + "External id": 450334,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 3869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008246880.366, "dur": 37.063, + "args": { + "External id": 450335,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 3870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008246933.540, "dur": 40.329, + "args": { + "External id": 450336,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 3871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008246982.879, "dur": 26.848, + "args": { + "External id": 450337,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247015.900, "dur": 33.124, + "args": { + "External id": 450338,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247056.983, "dur": 21.645, + "args": { + "External id": 450339,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 3874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247104.122, "dur": 33.798, + "args": { + "External id": 450340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 3875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008247162.046, "dur": 22.935, + "args": { + "External id": 450341,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 3876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008247202.668, "dur": 26.103, + "args": { + "External id": 450342,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008247247.904, "dur": 17.972, + "args": { + "External id": 450343,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008247276.781, "dur": 16.485, + "args": { + "External id": 450344,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247303.089, "dur": 35.857, + "args": { + "External id": 450345,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247342.017, "dur": 33.641, + "args": { + "External id": 450346,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008247400.594, "dur": 172.286, + "args": { + "External id": 450347,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008247485.382, "dur": 5.265, + "args": { + "External id": 450348,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008247492.303, "dur": 2.413, + "args": { + "External id": 450349,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008247602.811, "dur": 22.959, + "args": { + "External id": 450350,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008247636.313, "dur": 12.992, + "args": { + "External id": 450351,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247694.703, "dur": 49.527, + "args": { + "External id": 450352,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247752.279, "dur": 33.553, + "args": { + "External id": 450353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247792.097, "dur": 27.897, + "args": { + "External id": 450354,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247824.462, "dur": 31.456, + "args": { + "External id": 450355,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247861.187, "dur": 27.591, + "args": { + "External id": 450356,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 3891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008247898.339, "dur": 28.345, + "args": { + "External id": 450357,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 3892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008247946.973, "dur": 21.123, + "args": { + "External id": 450358,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 3893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008247984.198, "dur": 26.003, + "args": { + "External id": 450359,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008248023.745, "dur": 27.368, + "args": { + "External id": 450360,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 3895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008248074.020, "dur": 34.986, + "args": { + "External id": 450361,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 3896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008248125.297, "dur": 16.333, + "args": { + "External id": 450362,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 3897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248214.915, "dur": 17.040, + "args": { + "External id": 450363,"Record function id": 0, "Ev Idx": 3898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248217.658, "dur": 13.415, + "args": { + "External id": 450364,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248224.851, "dur": 5.354, + "args": { + "External id": 450365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248226.117, "dur": 3.987, + "args": { + "External id": 450366,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248235.671, "dur": 4.493, + "args": { + "External id": 450367,"Record function id": 0, "Ev Idx": 3902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248236.977, "dur": 2.756, + "args": { + "External id": 450368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248238.071, "dur": 1.240, + "args": { + "External id": 450369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248238.444, "dur": 0.798, + "args": { + "External id": 450370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248243.259, "dur": 3.991, + "args": { + "External id": 450371,"Record function id": 0, "Ev Idx": 3906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248244.397, "dur": 2.434, + "args": { + "External id": 450372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248245.122, "dur": 1.262, + "args": { + "External id": 450373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248245.677, "dur": 0.620, + "args": { + "External id": 450374,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 3909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248250.407, "dur": 5.290, + "args": { + "External id": 450375,"Record function id": 0, "Ev Idx": 3910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248252.030, "dur": 3.246, + "args": { + "External id": 450376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248252.546, "dur": 2.325, + "args": { + "External id": 450377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248252.974, "dur": 1.826, + "args": { + "External id": 450378,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 3913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248258.863, "dur": 4.373, + "args": { + "External id": 450379,"Record function id": 0, "Ev Idx": 3914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248260.405, "dur": 2.385, + "args": { + "External id": 450380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248260.942, "dur": 1.424, + "args": { + "External id": 450381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248261.446, "dur": 0.853, + "args": { + "External id": 450382,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248266.398, "dur": 4.161, + "args": { + "External id": 450383,"Record function id": 0, "Ev Idx": 3918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248267.521, "dur": 2.638, + "args": { + "External id": 450384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248268.443, "dur": 1.295, + "args": { + "External id": 450385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248269.074, "dur": 0.598, + "args": { + "External id": 450386,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248273.704, "dur": 4.471, + "args": { + "External id": 450387,"Record function id": 0, "Ev Idx": 3922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248274.896, "dur": 2.890, + "args": { + "External id": 450388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248275.722, "dur": 1.629, + "args": { + "External id": 450389,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248276.397, "dur": 0.888, + "args": { + "External id": 450390,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248287.370, "dur": 3.553, + "args": { + "External id": 450391,"Record function id": 0, "Ev Idx": 3926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248288.464, "dur": 2.077, + "args": { + "External id": 450392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248288.947, "dur": 1.178, + "args": { + "External id": 450393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248289.448, "dur": 0.613, + "args": { + "External id": 450394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 3929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248293.890, "dur": 5.031, + "args": { + "External id": 450395,"Record function id": 0, "Ev Idx": 3930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008248294.958, "dur": 3.551, + "args": { + "External id": 450396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008248295.877, "dur": 2.229, + "args": { + "External id": 450397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008248297.361, "dur": 0.679, + "args": { + "External id": 450398,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 3933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008248302.486, "dur": 14881.661, + "args": { + "External id": 450399,"Record function id": 0, "Sequence number": 5285397, "Fwd thread id": 1, "Ev Idx": 3934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008248303.981, "dur": 14871.416, + "args": { + "External id": 450400,"Sequence number": 5285397, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 3935 + } + }, + { + "ph": "f", "id": 203, "pid": 4183441, "tid": 31362, "ts": 676008248303.981, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008248333.009, "dur": 41.114, + "args": { + "External id": 450401,"Record function id": 0, "Ev Idx": 3936 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008248382.064, "dur": 67.620, + "args": { + "External id": 450402,"Record function id": 0, "Ev Idx": 3937 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.4)", "pid": 4183441, "tid": 31362, + "ts": 676008248455.299, "dur": 14712.429, + "args": { + "External id": 450403,"Record function id": 0, "Ev Idx": 3938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008248546.384, "dur": 6.783, + "args": { + "External id": 450404,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008248563.166, "dur": 4.355, + "args": { + "External id": 450405,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008248584.098, "dur": 13890.966, + "args": { + "External id": 450406,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008248596.891, "dur": 13870.110, + "args": { + "External id": 450407,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 3942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008248622.083, "dur": 14.783, + "args": { + "External id": 450408,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008248641.434, "dur": 13789.836, + "args": { + "External id": 450409,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 3944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008248643.663, "dur": 13786.936, + "args": { + "External id": 450410,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 3945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008248647.630, "dur": 40.895, + "args": { + "External id": 450411,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008248691.599, "dur": 13735.534, + "args": { + "External id": 450412,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 3947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008262563.648, "dur": 9.007, + "args": { + "External id": 450413,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 3948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008262566.657, "dur": 5.575, + "args": { + "External id": 450414,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008262601.063, "dur": 274.363, + "args": { + "External id": 450415,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 3950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008262625.764, "dur": 245.001, + "args": { + "External id": 450416,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3951, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008262637.043, "dur": 228.932, + "args": { + "External id": 450417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 3952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008262892.316, "dur": 2.093, + "args": { + "External id": 450418,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3953, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008262949.173, "dur": 5.967, + "args": { + "External id": 450419,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008262998.458, "dur": 1.449, + "args": { + "External id": 450420,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263015.271, "dur": 1.385, + "args": { + "External id": 450421,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263027.424, "dur": 2.288, + "args": { + "External id": 450422,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263040.273, "dur": 1.003, + "args": { + "External id": 450423,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263051.194, "dur": 1.170, + "args": { + "External id": 450424,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263061.986, "dur": 0.892, + "args": { + "External id": 450425,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263073.118, "dur": 2.429, + "args": { + "External id": 450426,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263102.426, "dur": 1.908, + "args": { + "External id": 450427,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008263198.544, "dur": 2626.904, + "args": { + "External id": 450428,"Record function id": 0, "Ev Idx": 3963 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008263217.253, "dur": 978.161, + "args": { + "External id": 450429,"Record function id": 0, "Ev Idx": 3964 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008263232.089, "dur": 284.748, + "args": { + "External id": 450430,"Record function id": 0, "Ev Idx": 3965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263313.351, "dur": 4.058, + "args": { + "External id": 450431,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 3966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263320.686, "dur": 1.032, + "args": { + "External id": 450432,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263323.386, "dur": 0.918, + "args": { + "External id": 450433,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263325.911, "dur": 0.807, + "args": { + "External id": 450434,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263328.122, "dur": 1.976, + "args": { + "External id": 450435,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263331.614, "dur": 1.219, + "args": { + "External id": 450436,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 3971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263334.339, "dur": 0.985, + "args": { + "External id": 450437,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 3972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263336.765, "dur": 1.249, + "args": { + "External id": 450438,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263339.865, "dur": 1.165, + "args": { + "External id": 450439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008263342.393, "dur": 1.184, + "args": { + "External id": 450440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 3975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008263360.179, "dur": 130.400, + "args": { + "External id": 450441,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008263374.811, "dur": 111.889, + "args": { + "External id": 450442,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 3977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008263386.233, "dur": 12.762, + "args": { + "External id": 450443,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008263401.492, "dur": 57.840, + "args": { + "External id": 450444,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 3979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008263404.263, "dur": 54.738, + "args": { + "External id": 450445,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 3980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263407.833, "dur": 4.591, + "args": { + "External id": 450446,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008263414.210, "dur": 44.195, + "args": { + "External id": 450447,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 3982 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.2", "pid": 4183441, "tid": 31362, + "ts": 676008263598.995, "dur": 588.707, + "args": { + "External id": 450448,"Record function id": 0, "Ev Idx": 3983 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008263614.688, "dur": 560.958, + "args": { + "External id": 450449,"Record function id": 0, "Ev Idx": 3984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008263716.762, "dur": 8.268, + "args": { + "External id": 450450,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008263740.466, "dur": 30.973, + "args": { + "External id": 450451,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 3986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263744.880, "dur": 1.621, + "args": { + "External id": 450452,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263751.284, "dur": 0.623, + "args": { + "External id": 450453,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263753.453, "dur": 0.510, + "args": { + "External id": 450454,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263755.769, "dur": 0.729, + "args": { + "External id": 450455,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263757.664, "dur": 0.170, + "args": { + "External id": 450456,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263759.094, "dur": 0.358, + "args": { + "External id": 450457,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263760.785, "dur": 0.334, + "args": { + "External id": 450458,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263763.138, "dur": 2.303, + "args": { + "External id": 450459,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263766.590, "dur": 0.443, + "args": { + "External id": 450460,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 3995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008263781.997, "dur": 33.190, + "args": { + "External id": 450461,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 3996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008263846.536, "dur": 95.567, + "args": { + "External id": 450462,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 3997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008263855.687, "dur": 4.104, + "args": { + "External id": 450463,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008263864.502, "dur": 9.842, + "args": { + "External id": 450464,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 3999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008263868.747, "dur": 5.180, + "args": { + "External id": 450465,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263871.943, "dur": 0.597, + "args": { + "External id": 450466,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008263881.048, "dur": 23.821, + "args": { + "External id": 450467,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263882.920, "dur": 0.380, + "args": { + "External id": 450468,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263884.610, "dur": 0.613, + "args": { + "External id": 450469,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263886.995, "dur": 0.770, + "args": { + "External id": 450470,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263888.989, "dur": 0.764, + "args": { + "External id": 450471,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263891.765, "dur": 2.506, + "args": { + "External id": 450472,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263895.616, "dur": 0.549, + "args": { + "External id": 450473,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263897.949, "dur": 0.646, + "args": { + "External id": 450474,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263899.783, "dur": 0.430, + "args": { + "External id": 450475,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008263902.088, "dur": 0.361, + "args": { + "External id": 450476,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008263915.811, "dur": 19.111, + "args": { + "External id": 450477,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008263985.698, "dur": 120.644, + "args": { + "External id": 450478,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008264009.650, "dur": 92.630, + "args": { + "External id": 450479,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4014, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008264018.758, "dur": 61.166, + "args": { + "External id": 450480,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008264123.450, "dur": 2.089, + "args": { + "External id": 450481,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4016, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008264202.418, "dur": 1601.991, + "args": { + "External id": 450482,"Sequence number": 5285396, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4017 + } + }, + { + "ph": "f", "id": 204, "pid": 4183441, "tid": 31362, "ts": 676008264202.418, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264311.235, "dur": 100.083, + "args": { + "External id": 450483,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008264451.003, "dur": 37.479, + "args": { + "External id": 450484,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008264504.477, "dur": 41.010, + "args": { + "External id": 450485,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264554.375, "dur": 27.406, + "args": { + "External id": 450486,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264587.731, "dur": 33.375, + "args": { + "External id": 450487,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264629.259, "dur": 61.774, + "args": { + "External id": 450488,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264702.705, "dur": 35.600, + "args": { + "External id": 450489,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008264762.393, "dur": 25.054, + "args": { + "External id": 450490,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008264805.248, "dur": 29.031, + "args": { + "External id": 450491,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008264854.284, "dur": 19.265, + "args": { + "External id": 450492,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008264886.855, "dur": 14.158, + "args": { + "External id": 450493,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264910.873, "dur": 39.890, + "args": { + "External id": 450494,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008264954.501, "dur": 32.393, + "args": { + "External id": 450495,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008265013.835, "dur": 192.953, + "args": { + "External id": 450496,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008265111.241, "dur": 7.406, + "args": { + "External id": 450497,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008265121.042, "dur": 4.074, + "args": { + "External id": 450498,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008265240.546, "dur": 27.645, + "args": { + "External id": 450499,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008265280.299, "dur": 14.476, + "args": { + "External id": 450500,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265303.315, "dur": 54.339, + "args": { + "External id": 450501,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265365.643, "dur": 36.162, + "args": { + "External id": 450502,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265407.577, "dur": 28.711, + "args": { + "External id": 450503,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265440.771, "dur": 29.500, + "args": { + "External id": 450504,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265476.994, "dur": 27.458, + "args": { + "External id": 450505,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008265513.113, "dur": 30.804, + "args": { + "External id": 450506,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008265560.926, "dur": 21.463, + "args": { + "External id": 450507,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008265612.780, "dur": 28.561, + "args": { + "External id": 450508,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008265691.368, "dur": 19.620, + "args": { + "External id": 450509,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008265729.513, "dur": 16.471, + "args": { + "External id": 450510,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008265758.664, "dur": 15.044, + "args": { + "External id": 450511,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265846.647, "dur": 14.889, + "args": { + "External id": 450512,"Record function id": 0, "Ev Idx": 4047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265850.171, "dur": 10.548, + "args": { + "External id": 450513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265854.104, "dur": 5.694, + "args": { + "External id": 450514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265855.695, "dur": 4.013, + "args": { + "External id": 450515,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265869.002, "dur": 5.472, + "args": { + "External id": 450516,"Record function id": 0, "Ev Idx": 4051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265870.981, "dur": 3.076, + "args": { + "External id": 450517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265871.970, "dur": 1.657, + "args": { + "External id": 450518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265872.523, "dur": 1.031, + "args": { + "External id": 450519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265877.607, "dur": 4.544, + "args": { + "External id": 450520,"Record function id": 0, "Ev Idx": 4055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265879.132, "dur": 2.590, + "args": { + "External id": 450521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265879.801, "dur": 1.330, + "args": { + "External id": 450522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265880.410, "dur": 0.639, + "args": { + "External id": 450523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265885.258, "dur": 5.541, + "args": { + "External id": 450524,"Record function id": 0, "Ev Idx": 4059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265886.758, "dur": 3.629, + "args": { + "External id": 450525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265887.521, "dur": 2.456, + "args": { + "External id": 450526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265887.853, "dur": 2.014, + "args": { + "External id": 450527,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265893.877, "dur": 5.000, + "args": { + "External id": 450528,"Record function id": 0, "Ev Idx": 4063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265895.662, "dur": 2.802, + "args": { + "External id": 450529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265896.374, "dur": 1.545, + "args": { + "External id": 450530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265896.917, "dur": 0.923, + "args": { + "External id": 450531,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265901.869, "dur": 3.834, + "args": { + "External id": 450532,"Record function id": 0, "Ev Idx": 4067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265903.154, "dur": 2.157, + "args": { + "External id": 450533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265903.643, "dur": 1.111, + "args": { + "External id": 450534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265904.144, "dur": 0.541, + "args": { + "External id": 450535,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265908.865, "dur": 4.364, + "args": { + "External id": 450536,"Record function id": 0, "Ev Idx": 4071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265910.218, "dur": 2.607, + "args": { + "External id": 450537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265910.899, "dur": 1.364, + "args": { + "External id": 450538,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265911.487, "dur": 0.680, + "args": { + "External id": 450539,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265916.225, "dur": 3.943, + "args": { + "External id": 450540,"Record function id": 0, "Ev Idx": 4075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265917.380, "dur": 2.358, + "args": { + "External id": 450541,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265918.182, "dur": 1.164, + "args": { + "External id": 450542,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265918.590, "dur": 0.664, + "args": { + "External id": 450543,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265926.759, "dur": 4.230, + "args": { + "External id": 450544,"Record function id": 0, "Ev Idx": 4079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008265928.502, "dur": 2.070, + "args": { + "External id": 450545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008265928.945, "dur": 1.226, + "args": { + "External id": 450546,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008265929.456, "dur": 0.621, + "args": { + "External id": 450547,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008265935.241, "dur": 14788.484, + "args": { + "External id": 450548,"Record function id": 0, "Sequence number": 5285395, "Fwd thread id": 1, "Ev Idx": 4083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008265936.424, "dur": 14778.270, + "args": { + "External id": 450549,"Sequence number": 5285395, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4084 + } + }, + { + "ph": "f", "id": 205, "pid": 4183441, "tid": 31362, "ts": 676008265936.424, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008265964.272, "dur": 39.559, + "args": { + "External id": 450550,"Record function id": 0, "Ev Idx": 4085 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008266011.819, "dur": 84.033, + "args": { + "External id": 450551,"Record function id": 0, "Ev Idx": 4086 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.3)", "pid": 4183441, "tid": 31362, + "ts": 676008266108.056, "dur": 14598.250, + "args": { + "External id": 450552,"Record function id": 0, "Ev Idx": 4087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008266199.574, "dur": 6.745, + "args": { + "External id": 450553,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008266216.645, "dur": 4.811, + "args": { + "External id": 450554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008266235.083, "dur": 13787.201, + "args": { + "External id": 450555,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008266248.707, "dur": 13765.310, + "args": { + "External id": 450556,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008266269.645, "dur": 14.379, + "args": { + "External id": 450557,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008266288.595, "dur": 13691.997, + "args": { + "External id": 450558,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008266291.202, "dur": 13688.585, + "args": { + "External id": 450559,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008266295.314, "dur": 4.604, + "args": { + "External id": 450560,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008266313.770, "dur": 13662.926, + "args": { + "External id": 450561,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008280123.317, "dur": 9.794, + "args": { + "External id": 450562,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008280126.170, "dur": 6.342, + "args": { + "External id": 450563,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008280160.427, "dur": 249.354, + "args": { + "External id": 450564,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008280187.133, "dur": 218.746, + "args": { + "External id": 450565,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4100, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008280198.228, "dur": 202.957, + "args": { + "External id": 450566,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008280426.859, "dur": 1.811, + "args": { + "External id": 450567,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4102, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280476.749, "dur": 6.165, + "args": { + "External id": 450568,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280523.960, "dur": 1.849, + "args": { + "External id": 450569,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280540.633, "dur": 1.343, + "args": { + "External id": 450570,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280553.421, "dur": 2.970, + "args": { + "External id": 450571,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280567.779, "dur": 0.794, + "args": { + "External id": 450572,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280578.637, "dur": 0.698, + "args": { + "External id": 450573,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280590.797, "dur": 0.926, + "args": { + "External id": 450574,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280603.053, "dur": 2.724, + "args": { + "External id": 450575,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280615.228, "dur": 0.913, + "args": { + "External id": 450576,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008280739.529, "dur": 2593.742, + "args": { + "External id": 450577,"Record function id": 0, "Ev Idx": 4112 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008280758.244, "dur": 997.019, + "args": { + "External id": 450578,"Record function id": 0, "Ev Idx": 4113 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008280772.880, "dur": 292.519, + "args": { + "External id": 450579,"Record function id": 0, "Ev Idx": 4114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280854.378, "dur": 4.883, + "args": { + "External id": 450580,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280862.364, "dur": 1.368, + "args": { + "External id": 450581,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280865.749, "dur": 1.488, + "args": { + "External id": 450582,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280868.936, "dur": 1.034, + "args": { + "External id": 450583,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280871.404, "dur": 2.566, + "args": { + "External id": 450584,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280875.664, "dur": 1.084, + "args": { + "External id": 450585,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280878.569, "dur": 0.964, + "args": { + "External id": 450586,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280881.439, "dur": 0.807, + "args": { + "External id": 450587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280883.898, "dur": 1.017, + "args": { + "External id": 450588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008280886.744, "dur": 0.763, + "args": { + "External id": 450589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008280904.026, "dur": 135.669, + "args": { + "External id": 450590,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008280918.810, "dur": 116.813, + "args": { + "External id": 450591,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008280930.276, "dur": 12.982, + "args": { + "External id": 450592,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008280945.726, "dur": 59.362, + "args": { + "External id": 450593,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008280948.637, "dur": 56.046, + "args": { + "External id": 450594,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008280952.337, "dur": 5.871, + "args": { + "External id": 450595,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008280959.892, "dur": 44.149, + "args": { + "External id": 450596,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4131 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.1", "pid": 4183441, "tid": 31362, + "ts": 676008281173.215, "dur": 574.135, + "args": { + "External id": 450597,"Record function id": 0, "Ev Idx": 4132 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008281190.427, "dur": 543.733, + "args": { + "External id": 450598,"Record function id": 0, "Ev Idx": 4133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008281254.842, "dur": 7.375, + "args": { + "External id": 450599,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008281278.057, "dur": 28.335, + "args": { + "External id": 450600,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281282.351, "dur": 1.594, + "args": { + "External id": 450601,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281285.739, "dur": 0.927, + "args": { + "External id": 450602,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281287.574, "dur": 0.649, + "args": { + "External id": 450603,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281290.087, "dur": 0.491, + "args": { + "External id": 450604,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281292.027, "dur": 0.514, + "args": { + "External id": 450605,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281294.073, "dur": 0.513, + "args": { + "External id": 450606,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281297.773, "dur": 0.288, + "args": { + "External id": 450607,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281298.840, "dur": 2.474, + "args": { + "External id": 450608,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281303.172, "dur": 0.391, + "args": { + "External id": 450609,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008281316.623, "dur": 34.637, + "args": { + "External id": 450610,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008281381.555, "dur": 98.349, + "args": { + "External id": 450611,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008281391.424, "dur": 3.342, + "args": { + "External id": 450612,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008281399.508, "dur": 12.683, + "args": { + "External id": 450613,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008281403.352, "dur": 8.461, + "args": { + "External id": 450614,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281409.814, "dur": 0.786, + "args": { + "External id": 450615,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008281419.520, "dur": 27.497, + "args": { + "External id": 450616,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281420.837, "dur": 0.581, + "args": { + "External id": 450617,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281422.860, "dur": 0.305, + "args": { + "External id": 450618,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281424.354, "dur": 0.701, + "args": { + "External id": 450619,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281426.895, "dur": 0.756, + "args": { + "External id": 450620,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281429.110, "dur": 2.665, + "args": { + "External id": 450621,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281433.378, "dur": 0.474, + "args": { + "External id": 450622,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281435.295, "dur": 0.578, + "args": { + "External id": 450623,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281437.215, "dur": 0.565, + "args": { + "External id": 450624,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008281438.940, "dur": 0.533, + "args": { + "External id": 450625,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008281455.797, "dur": 17.503, + "args": { + "External id": 450626,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008281521.063, "dur": 105.046, + "args": { + "External id": 450627,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008281544.759, "dur": 78.248, + "args": { + "External id": 450628,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4163, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008281554.768, "dur": 64.129, + "args": { + "External id": 450629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008281641.010, "dur": 2.075, + "args": { + "External id": 450630,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4165, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008281763.804, "dur": 1551.245, + "args": { + "External id": 450631,"Sequence number": 5285394, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4166 + } + }, + { + "ph": "f", "id": 206, "pid": 4183441, "tid": 31362, "ts": 676008281763.804, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008281875.197, "dur": 98.760, + "args": { + "External id": 450632,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008282015.613, "dur": 37.712, + "args": { + "External id": 450633,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008282069.462, "dur": 58.108, + "args": { + "External id": 450634,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282140.272, "dur": 27.740, + "args": { + "External id": 450635,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282174.273, "dur": 34.896, + "args": { + "External id": 450636,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282217.763, "dur": 21.201, + "args": { + "External id": 450637,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282246.387, "dur": 29.327, + "args": { + "External id": 450638,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008282298.443, "dur": 23.068, + "args": { + "External id": 450639,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008282346.905, "dur": 25.679, + "args": { + "External id": 450640,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008282390.773, "dur": 19.482, + "args": { + "External id": 450641,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008282421.044, "dur": 15.568, + "args": { + "External id": 450642,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282445.821, "dur": 36.662, + "args": { + "External id": 450643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282485.536, "dur": 30.297, + "args": { + "External id": 450644,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008282541.005, "dur": 201.044, + "args": { + "External id": 450645,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008282614.029, "dur": 5.300, + "args": { + "External id": 450646,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008282621.097, "dur": 2.431, + "args": { + "External id": 450647,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008282777.398, "dur": 30.613, + "args": { + "External id": 450648,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008282818.967, "dur": 15.203, + "args": { + "External id": 450649,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282842.824, "dur": 53.564, + "args": { + "External id": 450650,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282902.387, "dur": 31.475, + "args": { + "External id": 450651,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282940.323, "dur": 28.188, + "args": { + "External id": 450652,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008282976.349, "dur": 28.482, + "args": { + "External id": 450653,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008283010.018, "dur": 27.692, + "args": { + "External id": 450654,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008283044.072, "dur": 28.591, + "args": { + "External id": 450655,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008283107.449, "dur": 40.622, + "args": { + "External id": 450656,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008283173.442, "dur": 26.457, + "args": { + "External id": 450657,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008283213.676, "dur": 14.712, + "args": { + "External id": 450658,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008283243.974, "dur": 13.304, + "args": { + "External id": 450659,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008283269.192, "dur": 15.327, + "args": { + "External id": 450660,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283354.076, "dur": 17.338, + "args": { + "External id": 450661,"Record function id": 0, "Ev Idx": 4196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283360.232, "dur": 10.280, + "args": { + "External id": 450662,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283364.256, "dur": 5.441, + "args": { + "External id": 450663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283365.626, "dur": 3.977, + "args": { + "External id": 450664,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283375.259, "dur": 4.255, + "args": { + "External id": 450665,"Record function id": 0, "Ev Idx": 4200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283376.429, "dur": 2.658, + "args": { + "External id": 450666,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283377.366, "dur": 1.294, + "args": { + "External id": 450667,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283377.860, "dur": 0.716, + "args": { + "External id": 450668,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283382.742, "dur": 4.134, + "args": { + "External id": 450669,"Record function id": 0, "Ev Idx": 4204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283383.920, "dur": 2.467, + "args": { + "External id": 450670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283384.456, "dur": 1.501, + "args": { + "External id": 450671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283384.910, "dur": 0.962, + "args": { + "External id": 450672,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283390.066, "dur": 4.061, + "args": { + "External id": 450673,"Record function id": 0, "Ev Idx": 4208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283391.066, "dur": 2.620, + "args": { + "External id": 450674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283391.795, "dur": 1.488, + "args": { + "External id": 450675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283392.290, "dur": 0.901, + "args": { + "External id": 450676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283397.190, "dur": 4.207, + "args": { + "External id": 450677,"Record function id": 0, "Ev Idx": 4212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283398.199, "dur": 2.744, + "args": { + "External id": 450678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283398.710, "dur": 1.829, + "args": { + "External id": 450679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283399.245, "dur": 1.195, + "args": { + "External id": 450680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283404.408, "dur": 4.523, + "args": { + "External id": 450681,"Record function id": 0, "Ev Idx": 4216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283405.832, "dur": 2.666, + "args": { + "External id": 450682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283406.305, "dur": 1.613, + "args": { + "External id": 450683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283406.806, "dur": 1.019, + "args": { + "External id": 450684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283412.020, "dur": 4.976, + "args": { + "External id": 450685,"Record function id": 0, "Ev Idx": 4220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283413.521, "dur": 3.015, + "args": { + "External id": 450686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283414.196, "dur": 1.788, + "args": { + "External id": 450687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283414.983, "dur": 0.934, + "args": { + "External id": 450688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283419.967, "dur": 4.315, + "args": { + "External id": 450689,"Record function id": 0, "Ev Idx": 4224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283421.396, "dur": 2.464, + "args": { + "External id": 450690,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283421.915, "dur": 1.528, + "args": { + "External id": 450691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283422.463, "dur": 0.884, + "args": { + "External id": 450692,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283427.665, "dur": 4.172, + "args": { + "External id": 450693,"Record function id": 0, "Ev Idx": 4228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008283428.602, "dur": 2.801, + "args": { + "External id": 450694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008283429.083, "dur": 1.843, + "args": { + "External id": 450695,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008283430.000, "dur": 0.833, + "args": { + "External id": 450696,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008283438.987, "dur": 14879.797, + "args": { + "External id": 450697,"Record function id": 0, "Sequence number": 5285393, "Fwd thread id": 1, "Ev Idx": 4232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008283440.750, "dur": 14868.739, + "args": { + "External id": 450698,"Sequence number": 5285393, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4233 + } + }, + { + "ph": "f", "id": 207, "pid": 4183441, "tid": 31362, "ts": 676008283440.750, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008283468.469, "dur": 37.637, + "args": { + "External id": 450699,"Record function id": 0, "Ev Idx": 4234 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008283513.272, "dur": 66.530, + "args": { + "External id": 450700,"Record function id": 0, "Ev Idx": 4235 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.2)", "pid": 4183441, "tid": 31362, + "ts": 676008283585.981, "dur": 14715.878, + "args": { + "External id": 450701,"Record function id": 0, "Ev Idx": 4236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008283709.792, "dur": 7.297, + "args": { + "External id": 450702,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008283727.814, "dur": 5.089, + "args": { + "External id": 450703,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008283751.006, "dur": 13831.313, + "args": { + "External id": 450704,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008283764.244, "dur": 13810.204, + "args": { + "External id": 450705,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008283793.647, "dur": 16.839, + "args": { + "External id": 450706,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008283815.191, "dur": 13726.535, + "args": { + "External id": 450707,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008283817.716, "dur": 13723.213, + "args": { + "External id": 450708,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008283821.929, "dur": 4.599, + "args": { + "External id": 450709,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008283828.279, "dur": 13709.381, + "args": { + "External id": 450710,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008297692.869, "dur": 9.564, + "args": { + "External id": 450711,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008297695.646, "dur": 6.187, + "args": { + "External id": 450712,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008297729.053, "dur": 288.594, + "args": { + "External id": 450713,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008297754.728, "dur": 258.417, + "args": { + "External id": 450714,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4249, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008297766.225, "dur": 242.171, + "args": { + "External id": 450715,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008298033.594, "dur": 1.998, + "args": { + "External id": 450716,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4251, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298102.525, "dur": 6.359, + "args": { + "External id": 450717,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298153.401, "dur": 1.892, + "args": { + "External id": 450718,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298170.272, "dur": 1.356, + "args": { + "External id": 450719,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298183.446, "dur": 1.199, + "args": { + "External id": 450720,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298195.389, "dur": 1.140, + "args": { + "External id": 450721,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298206.572, "dur": 1.340, + "args": { + "External id": 450722,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298218.209, "dur": 1.157, + "args": { + "External id": 450723,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298230.654, "dur": 1.311, + "args": { + "External id": 450724,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298242.449, "dur": 0.746, + "args": { + "External id": 450725,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008298333.699, "dur": 2601.427, + "args": { + "External id": 450726,"Record function id": 0, "Ev Idx": 4261 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008298352.733, "dur": 976.251, + "args": { + "External id": 450727,"Record function id": 0, "Ev Idx": 4262 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008298368.068, "dur": 327.497, + "args": { + "External id": 450728,"Record function id": 0, "Ev Idx": 4263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298448.765, "dur": 4.425, + "args": { + "External id": 450729,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298456.706, "dur": 1.595, + "args": { + "External id": 450730,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298460.273, "dur": 1.332, + "args": { + "External id": 450731,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298463.393, "dur": 1.073, + "args": { + "External id": 450732,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298466.354, "dur": 0.990, + "args": { + "External id": 450733,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298468.713, "dur": 1.220, + "args": { + "External id": 450734,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298471.643, "dur": 1.028, + "args": { + "External id": 450735,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298474.457, "dur": 1.219, + "args": { + "External id": 450736,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298477.484, "dur": 1.282, + "args": { + "External id": 450737,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008298480.151, "dur": 1.197, + "args": { + "External id": 450738,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008298498.605, "dur": 134.602, + "args": { + "External id": 450739,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008298513.522, "dur": 115.296, + "args": { + "External id": 450740,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008298525.475, "dur": 13.662, + "args": { + "External id": 450741,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008298541.909, "dur": 61.217, + "args": { + "External id": 450742,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008298544.526, "dur": 58.280, + "args": { + "External id": 450743,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298548.182, "dur": 6.210, + "args": { + "External id": 450744,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008298557.477, "dur": 44.638, + "args": { + "External id": 450745,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4280 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.0", "pid": 4183441, "tid": 31362, + "ts": 676008298790.946, "dur": 530.876, + "args": { + "External id": 450746,"Record function id": 0, "Ev Idx": 4281 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008298806.705, "dur": 502.774, + "args": { + "External id": 450747,"Record function id": 0, "Ev Idx": 4282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008298867.486, "dur": 6.088, + "args": { + "External id": 450748,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008298887.640, "dur": 25.415, + "args": { + "External id": 450749,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298891.909, "dur": 1.554, + "args": { + "External id": 450750,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298895.066, "dur": 1.297, + "args": { + "External id": 450751,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298897.374, "dur": 0.679, + "args": { + "External id": 450752,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298899.115, "dur": 1.027, + "args": { + "External id": 450753,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298902.101, "dur": 0.816, + "args": { + "External id": 450754,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298904.055, "dur": 0.606, + "args": { + "External id": 450755,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298905.716, "dur": 0.795, + "args": { + "External id": 450756,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298907.915, "dur": 0.554, + "args": { + "External id": 450757,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008298909.401, "dur": 0.733, + "args": { + "External id": 450758,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008298922.918, "dur": 28.721, + "args": { + "External id": 450759,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 31362, + "ts": 676008298982.920, "dur": 117.477, + "args": { + "External id": 450760,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008298992.622, "dur": 3.829, + "args": { + "External id": 450761,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 31362, + "ts": 676008299000.874, "dur": 10.129, + "args": { + "External id": 450762,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 31362, + "ts": 676008299004.868, "dur": 5.738, + "args": { + "External id": 450763,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299008.190, "dur": 1.239, + "args": { + "External id": 450764,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 31362, + "ts": 676008299020.103, "dur": 26.414, + "args": { + "External id": 450765,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299021.777, "dur": 0.894, + "args": { + "External id": 450766,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299023.923, "dur": 0.648, + "args": { + "External id": 450767,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299025.990, "dur": 0.623, + "args": { + "External id": 450768,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299027.933, "dur": 1.195, + "args": { + "External id": 450769,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299030.455, "dur": 0.727, + "args": { + "External id": 450770,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299032.230, "dur": 0.801, + "args": { + "External id": 450771,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299034.494, "dur": 0.557, + "args": { + "External id": 450772,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299036.181, "dur": 0.933, + "args": { + "External id": 450773,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008299038.415, "dur": 0.786, + "args": { + "External id": 450774,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 31362, + "ts": 676008299055.650, "dur": 22.082, + "args": { + "External id": 450775,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 31362, + "ts": 676008299146.363, "dur": 102.652, + "args": { + "External id": 450776,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008299169.155, "dur": 76.548, + "args": { + "External id": 450777,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4312, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 31362, + "ts": 676008299178.018, "dur": 63.636, + "args": { + "External id": 450778,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008299261.895, "dur": 2.125, + "args": { + "External id": 450779,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4314, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008299336.479, "dur": 1576.987, + "args": { + "External id": 450780,"Sequence number": 5285392, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4315 + } + }, + { + "ph": "f", "id": 208, "pid": 4183441, "tid": 31362, "ts": 676008299336.479, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008299447.655, "dur": 96.174, + "args": { + "External id": 450781,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008299583.271, "dur": 37.299, + "args": { + "External id": 450782,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008299636.839, "dur": 82.279, + "args": { + "External id": 450783,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008299734.956, "dur": 28.969, + "args": { + "External id": 450784,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008299771.000, "dur": 35.050, + "args": { + "External id": 450785,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008299812.633, "dur": 21.447, + "args": { + "External id": 450786,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008299841.793, "dur": 29.292, + "args": { + "External id": 450787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008299896.138, "dur": 26.461, + "args": { + "External id": 450788,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008299939.236, "dur": 26.657, + "args": { + "External id": 450789,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008299985.659, "dur": 17.899, + "args": { + "External id": 450790,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008300015.679, "dur": 14.965, + "args": { + "External id": 450791,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300038.583, "dur": 34.813, + "args": { + "External id": 450792,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300077.036, "dur": 50.795, + "args": { + "External id": 450793,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008300158.683, "dur": 163.103, + "args": { + "External id": 450794,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008300233.148, "dur": 6.037, + "args": { + "External id": 450795,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008300241.375, "dur": 2.875, + "args": { + "External id": 450796,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008300354.172, "dur": 22.552, + "args": { + "External id": 450797,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008300387.903, "dur": 17.120, + "args": { + "External id": 450798,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300412.915, "dur": 47.122, + "args": { + "External id": 450799,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300465.795, "dur": 30.622, + "args": { + "External id": 450800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300502.966, "dur": 28.078, + "args": { + "External id": 450801,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300537.747, "dur": 28.902, + "args": { + "External id": 450802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300572.673, "dur": 28.425, + "args": { + "External id": 450803,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008300608.994, "dur": 28.357, + "args": { + "External id": 450804,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008300691.089, "dur": 28.508, + "args": { + "External id": 450805,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008300747.443, "dur": 35.192, + "args": { + "External id": 450806,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008300801.301, "dur": 17.765, + "args": { + "External id": 450807,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008300838.511, "dur": 15.879, + "args": { + "External id": 450808,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008300866.669, "dur": 15.903, + "args": { + "External id": 450809,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300959.544, "dur": 14.919, + "args": { + "External id": 450810,"Record function id": 0, "Ev Idx": 4345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300962.876, "dur": 10.756, + "args": { + "External id": 450811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008300967.031, "dur": 5.705, + "args": { + "External id": 450812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008300968.703, "dur": 3.942, + "args": { + "External id": 450813,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300978.304, "dur": 5.328, + "args": { + "External id": 450814,"Record function id": 0, "Ev Idx": 4349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300979.869, "dur": 3.337, + "args": { + "External id": 450815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008300981.116, "dur": 1.644, + "args": { + "External id": 450816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008300981.626, "dur": 1.044, + "args": { + "External id": 450817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300986.914, "dur": 4.320, + "args": { + "External id": 450818,"Record function id": 0, "Ev Idx": 4353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300988.215, "dur": 2.622, + "args": { + "External id": 450819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008300988.854, "dur": 1.552, + "args": { + "External id": 450820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008300989.274, "dur": 1.020, + "args": { + "External id": 450821,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300994.344, "dur": 4.390, + "args": { + "External id": 450822,"Record function id": 0, "Ev Idx": 4357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008300995.931, "dur": 2.429, + "args": { + "External id": 450823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008300996.417, "dur": 1.531, + "args": { + "External id": 450824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008300996.677, "dur": 1.177, + "args": { + "External id": 450825,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301001.842, "dur": 7.276, + "args": { + "External id": 450826,"Record function id": 0, "Ev Idx": 4361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301003.150, "dur": 5.548, + "args": { + "External id": 450827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008301006.971, "dur": 1.330, + "args": { + "External id": 450828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008301007.331, "dur": 0.902, + "args": { + "External id": 450829,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301012.319, "dur": 3.906, + "args": { + "External id": 450830,"Record function id": 0, "Ev Idx": 4365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301013.525, "dur": 2.290, + "args": { + "External id": 450831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008301013.987, "dur": 1.435, + "args": { + "External id": 450832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008301014.654, "dur": 0.673, + "args": { + "External id": 450833,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301019.465, "dur": 4.675, + "args": { + "External id": 450834,"Record function id": 0, "Ev Idx": 4369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301020.823, "dur": 2.930, + "args": { + "External id": 450835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008301021.284, "dur": 1.762, + "args": { + "External id": 450836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008301022.011, "dur": 0.939, + "args": { + "External id": 450837,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301027.120, "dur": 3.512, + "args": { + "External id": 450838,"Record function id": 0, "Ev Idx": 4373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301028.084, "dur": 2.146, + "args": { + "External id": 450839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008301028.653, "dur": 1.192, + "args": { + "External id": 450840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008301029.013, "dur": 0.766, + "args": { + "External id": 450841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301033.919, "dur": 3.903, + "args": { + "External id": 450842,"Record function id": 0, "Ev Idx": 4377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008301034.940, "dur": 2.480, + "args": { + "External id": 450843,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008301035.408, "dur": 1.580, + "args": { + "External id": 450844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008301036.160, "dur": 0.733, + "args": { + "External id": 450845,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008301041.582, "dur": 14853.422, + "args": { + "External id": 450846,"Record function id": 0, "Sequence number": 5285391, "Fwd thread id": 1, "Ev Idx": 4381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008301043.033, "dur": 14843.773, + "args": { + "External id": 450847,"Sequence number": 5285391, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4382 + } + }, + { + "ph": "f", "id": 209, "pid": 4183441, "tid": 31362, "ts": 676008301043.033, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008301073.808, "dur": 54.202, + "args": { + "External id": 450848,"Record function id": 0, "Ev Idx": 4383 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008301137.138, "dur": 70.363, + "args": { + "External id": 450849,"Record function id": 0, "Ev Idx": 4384 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.1)", "pid": 4183441, "tid": 31362, + "ts": 676008301213.577, "dur": 14666.060, + "args": { + "External id": 450850,"Record function id": 0, "Ev Idx": 4385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008301297.857, "dur": 9.796, + "args": { + "External id": 450851,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008301317.602, "dur": 5.018, + "args": { + "External id": 450852,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008301335.987, "dur": 13877.102, + "args": { + "External id": 450853,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008301348.941, "dur": 13856.773, + "args": { + "External id": 450854,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008301374.993, "dur": 13.493, + "args": { + "External id": 450855,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008301392.860, "dur": 13777.824, + "args": { + "External id": 450856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008301396.095, "dur": 13773.848, + "args": { + "External id": 450857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008301399.928, "dur": 4.830, + "args": { + "External id": 450858,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008301406.372, "dur": 13760.408, + "args": { + "External id": 450859,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008315299.371, "dur": 9.601, + "args": { + "External id": 450860,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008315302.573, "dur": 6.067, + "args": { + "External id": 450861,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008315335.513, "dur": 242.589, + "args": { + "External id": 450862,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008315361.149, "dur": 212.989, + "args": { + "External id": 450863,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4398, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008315372.468, "dur": 197.094, + "args": { + "External id": 450864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008315593.494, "dur": 2.306, + "args": { + "External id": 450865,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4400, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315644.570, "dur": 6.259, + "args": { + "External id": 450866,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315726.685, "dur": 2.738, + "args": { + "External id": 450867,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315745.779, "dur": 1.586, + "args": { + "External id": 450868,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315759.004, "dur": 1.090, + "args": { + "External id": 450869,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315771.650, "dur": 1.152, + "args": { + "External id": 450870,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315783.633, "dur": 1.205, + "args": { + "External id": 450871,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315795.580, "dur": 1.306, + "args": { + "External id": 450872,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315808.236, "dur": 1.042, + "args": { + "External id": 450873,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008315819.075, "dur": 1.361, + "args": { + "External id": 450874,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008315909.983, "dur": 2009.375, + "args": { + "External id": 450875,"Record function id": 0, "Ev Idx": 4410 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008315929.070, "dur": 431.410, + "args": { + "External id": 450876,"Record function id": 0, "Ev Idx": 4411 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008315942.911, "dur": 316.326, + "args": { + "External id": 450877,"Record function id": 0, "Ev Idx": 4412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316030.308, "dur": 4.206, + "args": { + "External id": 450878,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316037.303, "dur": 1.190, + "args": { + "External id": 450879,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316040.358, "dur": 1.062, + "args": { + "External id": 450880,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316043.099, "dur": 0.892, + "args": { + "External id": 450881,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316045.603, "dur": 1.143, + "args": { + "External id": 450882,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316048.217, "dur": 1.157, + "args": { + "External id": 450883,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316051.094, "dur": 1.252, + "args": { + "External id": 450884,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316054.556, "dur": 0.914, + "args": { + "External id": 450885,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316057.137, "dur": 1.383, + "args": { + "External id": 450886,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008316060.231, "dur": 1.237, + "args": { + "External id": 450887,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008316077.651, "dur": 152.494, + "args": { + "External id": 450888,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 31362, + "ts": 676008316107.781, "dur": 117.979, + "args": { + "External id": 450889,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008316120.005, "dur": 13.102, + "args": { + "External id": 450890,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008316135.765, "dur": 62.501, + "args": { + "External id": 450891,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008316139.444, "dur": 58.524, + "args": { + "External id": 450892,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008316142.984, "dur": 6.128, + "args": { + "External id": 450893,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008316150.771, "dur": 46.642, + "args": { + "External id": 450894,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008316367.376, "dur": 1529.433, + "args": { + "External id": 450895,"Sequence number": 5285390, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4430 + } + }, + { + "ph": "f", "id": 210, "pid": 4183441, "tid": 31362, "ts": 676008316367.376, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008316473.658, "dur": 95.717, + "args": { + "External id": 450896,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [2816, 1], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 4183441, "tid": 31362, + "ts": 676008316607.495, "dur": 37.421, + "args": { + "External id": 450897,"kernel_hash": "cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/qi/cqi3my7gniuzhkkicbmpu2ehufs4cfdw5bbb2xcgrnxwaumtxecr.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [65536, 2816], [16, 4096, 2816], [16, 4096, 2816], [16, 4096, 2816], []], "Ev Idx": 4432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 4183441, "tid": 31362, + "ts": 676008316704.851, "dur": 51.312, + "args": { + "External id": 450898,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 1024], [0, 2816, 1], [2883584, 2816, 1]], "Input Dims": [[1, 1024, 65536], [1, 65536, 2816], [1, 1024, 2816]], "Ev Idx": 4433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008316766.615, "dur": 27.541, + "args": { + "External id": 450899,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008316803.657, "dur": 33.815, + "args": { + "External id": 450900,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008316844.895, "dur": 20.060, + "args": { + "External id": 450901,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2816], [1024, 1], [1024, 1]], "Input Dims": [[2816, 65536], [65536, 1024], [2816, 1024]], "Ev Idx": 4436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008316873.604, "dur": 29.160, + "args": { + "External id": 450902,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 4183441, "tid": 31362, + "ts": 676008316927.177, "dur": 21.221, + "args": { + "External id": 450903,"kernel_hash": "cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/yr/cyrwxjdbvwf6akucu4niv2g5z23fqa7njihpx3zbqtlpr2t5ekyv.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 4438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 4183441, "tid": 31362, + "ts": 676008316966.161, "dur": 26.409, + "args": { + "External id": 450904,"kernel_hash": "ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctdy2xnswudjzaudqvsfvpsbw3l6ecqdeqjvat2ogv3qlc2ewke6.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008317013.774, "dur": 17.105, + "args": { + "External id": 450905,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008317043.614, "dur": 13.532, + "args": { + "External id": 450906,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317064.429, "dur": 56.210, + "args": { + "External id": 450907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317125.985, "dur": 34.234, + "args": { + "External id": 450908,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 4183441, "tid": 31362, + "ts": 676008317190.465, "dur": 168.704, + "args": { + "External id": 450909,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [65536, 4096, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 16, 4096], [16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008317266.657, "dur": 6.465, + "args": { + "External id": 450910,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008317274.842, "dur": 3.565, + "args": { + "External id": 450911,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008317391.173, "dur": 26.292, + "args": { + "External id": 450912,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 31362, + "ts": 676008317428.414, "dur": 14.177, + "args": { + "External id": 450913,"kernel_hash": "cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/y7/cy7h7rraavoyniiun6rhu3ukjttf5o3ywelevnp36yqb5lof43te.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317450.286, "dur": 42.508, + "args": { + "External id": 450914,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317498.841, "dur": 30.807, + "args": { + "External id": 450915,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317535.607, "dur": 28.610, + "args": { + "External id": 450916,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317569.914, "dur": 28.326, + "args": { + "External id": 450917,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317603.524, "dur": 28.227, + "args": { + "External id": 450918,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 1024], [1024, 1], [1024, 1]], "Input Dims": [[1024, 65536], [65536, 1024], [1024, 1024]], "Ev Idx": 4453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 31362, + "ts": 676008317639.726, "dur": 66.029, + "args": { + "External id": 450919,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 4183441, "tid": 31362, + "ts": 676008317727.808, "dur": 21.088, + "args": { + "External id": 450920,"kernel_hash": "cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/oj/cojarcqspnjaqqw544b46gfj3ciyo57yqmzl62c7cueoi3y2bf27.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [65536, 1024], []], "Ev Idx": 4455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 4183441, "tid": 31362, + "ts": 676008317765.902, "dur": 22.455, + "args": { + "External id": 450921,"kernel_hash": "cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "1024", "1", "497", "132", "True", "1024", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/og/cogn37vjityfw5rcbmxxj6lgjwku7e3fa4fzif3k6wsbvsso35lu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [1024], [65536, 1024], [65536, 1024], [132, 1024], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 4183441, "tid": 31362, + "ts": 676008317801.099, "dur": 15.638, + "args": { + "External id": 450922,"kernel_hash": "c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "66"], "kernel_file": "/tmp/torchinductor_cvm/2t/c2tdqs4z5s2g7idtrlju22bmvlps3pfj3xmgtvzdb57pcy33gyuy.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [2048, 1, 1024], [], []], "Input Dims": [[132, 1024], [1, 1024, 2], [], []], "Ev Idx": 4457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 4183441, "tid": 31362, + "ts": 676008317829.803, "dur": 13.332, + "args": { + "External id": 450923,"kernel_hash": "c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq", "grid": "grid(1024,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "1024", "2"], "kernel_file": "/tmp/torchinductor_cvm/6b/c6bjioivs352u3y5eynatbjzxhmlyx2tgr5gaf7rtuqzkxo53wmq.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1, 1024], [1024, 1], [], []], "Input Dims": [[1, 1024, 2], [1, 1024], [], []], "Ev Idx": 4458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 4183441, "tid": 31362, + "ts": 676008317855.512, "dur": 14.110, + "args": { + "External id": 450924,"kernel_hash": "c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/5r/c5ryb2lnaqdhzttpdyhpq75wbuzpfvqr6nrxfday4u3g2nimqwqm.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], [16, 4096, 1024], []], "Ev Idx": 4459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317940.142, "dur": 20.005, + "args": { + "External id": 450925,"Record function id": 0, "Ev Idx": 4460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317947.122, "dur": 12.069, + "args": { + "External id": 450926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317951.320, "dur": 7.048, + "args": { + "External id": 450927,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008317952.783, "dur": 5.477, + "args": { + "External id": 450928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317963.859, "dur": 5.165, + "args": { + "External id": 450929,"Record function id": 0, "Ev Idx": 4464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317965.215, "dur": 3.366, + "args": { + "External id": 450930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317966.075, "dur": 1.879, + "args": { + "External id": 450931,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008317966.594, "dur": 1.244, + "args": { + "External id": 450932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317972.226, "dur": 5.600, + "args": { + "External id": 450933,"Record function id": 0, "Ev Idx": 4468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317974.140, "dur": 3.262, + "args": { + "External id": 450934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317975.098, "dur": 1.723, + "args": { + "External id": 450935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008317975.674, "dur": 1.067, + "args": { + "External id": 450936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1024]], "Ev Idx": 4471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317981.053, "dur": 5.231, + "args": { + "External id": 450937,"Record function id": 0, "Ev Idx": 4472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317983.201, "dur": 2.685, + "args": { + "External id": 450938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317984.384, "dur": 1.077, + "args": { + "External id": 450939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008317984.655, "dur": 0.729, + "args": { + "External id": 450940,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 4475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317989.339, "dur": 4.107, + "args": { + "External id": 450941,"Record function id": 0, "Ev Idx": 4476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317990.778, "dur": 2.241, + "args": { + "External id": 450942,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317991.252, "dur": 1.274, + "args": { + "External id": 450943,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008317991.664, "dur": 0.797, + "args": { + "External id": 450944,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317996.466, "dur": 9.035, + "args": { + "External id": 450945,"Record function id": 0, "Ev Idx": 4480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008317998.261, "dur": 6.814, + "args": { + "External id": 450946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008317999.358, "dur": 5.305, + "args": { + "External id": 450947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008318000.136, "dur": 4.462, + "args": { + "External id": 450948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318008.598, "dur": 5.174, + "args": { + "External id": 450949,"Record function id": 0, "Ev Idx": 4484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318009.992, "dur": 3.368, + "args": { + "External id": 450950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008318011.212, "dur": 1.758, + "args": { + "External id": 450951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008318011.725, "dur": 1.182, + "args": { + "External id": 450952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318016.792, "dur": 5.650, + "args": { + "External id": 450953,"Record function id": 0, "Ev Idx": 4488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318018.888, "dur": 3.152, + "args": { + "External id": 450954,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008318020.046, "dur": 1.450, + "args": { + "External id": 450955,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008318020.683, "dur": 0.745, + "args": { + "External id": 450956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 4491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318025.600, "dur": 3.824, + "args": { + "External id": 450957,"Record function id": 0, "Ev Idx": 4492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008318026.765, "dur": 2.235, + "args": { + "External id": 450958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008318027.264, "dur": 1.320, + "args": { + "External id": 450959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008318027.556, "dur": 0.961, + "args": { + "External id": 450960,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 4495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008318033.465, "dur": 15603.944, + "args": { + "External id": 450961,"Record function id": 0, "Sequence number": 5285389, "Fwd thread id": 1, "Ev Idx": 4496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008318035.063, "dur": 15594.587, + "args": { + "External id": 450962,"Sequence number": 5285389, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4497 + } + }, + { + "ph": "f", "id": 211, "pid": 4183441, "tid": 31362, "ts": 676008318035.063, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008318061.610, "dur": 83.330, + "args": { + "External id": 450963,"Record function id": 0, "Ev Idx": 4498 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008318154.666, "dur": 80.105, + "args": { + "External id": 450964,"Record function id": 0, "Ev Idx": 4499 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.0)", "pid": 4183441, "tid": 31362, + "ts": 676008318240.723, "dur": 15381.460, + "args": { + "External id": 450965,"Record function id": 0, "Ev Idx": 4500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008318342.334, "dur": 12.158, + "args": { + "External id": 450966,"Record function id": 0, "Concrete Inputs": ["[12847104]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008318365.578, "dur": 5.580, + "args": { + "External id": 450967,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008318384.566, "dur": 14533.080, + "args": { + "External id": 450968,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008318398.002, "dur": 14512.561, + "args": { + "External id": 450969,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [1024, 1], [1024, 1], [1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], [], [], [1605888, 1]], "Input Dims": [[[1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], [], [], [8, 1605888]], "Ev Idx": 4504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008318423.564, "dur": 14.249, + "args": { + "External id": 450970,"Record function id": 0, "Concrete Inputs": ["[3194]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008318446.013, "dur": 14431.109, + "args": { + "External id": 450971,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], [], []], "Ev Idx": 4506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008318448.385, "dur": 14428.030, + "args": { + "External id": 450972,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3194], [], [], [], [], [], []], "Ev Idx": 4507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008318452.126, "dur": 5.804, + "args": { + "External id": 450973,"Record function id": 0, "Concrete Inputs": ["[3194]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008318459.506, "dur": 14413.299, + "args": { + "External id": 450974,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3194], [3194], []], "Ev Idx": 4509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008333000.959, "dur": 9.294, + "args": { + "External id": 450975,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[12847104], [], [], [], [], []], "Ev Idx": 4510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008333003.918, "dur": 6.052, + "args": { + "External id": 450976,"Record function id": 0, "Concrete Inputs": ["[1605888]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008333036.838, "dur": 309.428, + "args": { + "External id": 450977,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[1605888], [12847104], [], [], [], []], "Ev Idx": 4512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008333061.967, "dur": 279.395, + "args": { + "External id": 450978,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1605888, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[12847104], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4513, "In msg nelems": 12847104 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008333073.768, "dur": 262.037, + "args": { + "External id": 450979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[12847104]], "Ev Idx": 4514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008333364.735, "dur": 2.188, + "args": { + "External id": 450980,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4515, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333422.012, "dur": 6.499, + "args": { + "External id": 450981,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333470.585, "dur": 1.409, + "args": { + "External id": 450982,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333488.975, "dur": 1.661, + "args": { + "External id": 450983,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "131200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333503.315, "dur": 1.006, + "args": { + "External id": 450984,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "262272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333515.961, "dur": 1.048, + "args": { + "External id": 450985,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "393344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333527.227, "dur": 1.153, + "args": { + "External id": 450986,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333538.916, "dur": 1.183, + "args": { + "External id": 450987,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333550.781, "dur": 1.139, + "args": { + "External id": 450988,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "884992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008333562.252, "dur": 0.975, + "args": { + "External id": 450989,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "1245440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008333651.107, "dur": 307.209, + "args": { + "External id": 450990,"Record function id": 0, "Sequence number": 5285388, "Fwd thread id": 1, "Ev Idx": 4525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 4183441, "tid": 31362, + "ts": 676008333688.197, "dur": 260.600, + "args": { + "External id": 450991,"Sequence number": 5285388, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4526 + } + }, + { + "ph": "f", "id": 212, "pid": 4183441, "tid": 31362, "ts": 676008333688.197, + "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_0", "pid": 4183441, "tid": 31362, + "ts": 676008333807.518, "dur": 43.818, + "args": { + "External id": 450992,"kernel_hash": "ciudretdwvj3qhmlixt4kkn5h73gwbliauiw4z4335ftxisnls4m", "grid": "grid(32768000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "32768000"], "kernel_file": "/tmp/torchinductor_cvm/iu/ciudretdwvj3qhmlixt4kkn5h73gwbliauiw4z4335ftxisnls4m.py", "kernel_backend": "triton", "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 4527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_1", "pid": 4183441, "tid": 31362, + "ts": 676008333868.025, "dur": 28.367, + "args": { + "External id": 450993,"kernel_hash": "crggdtu4kcao75se52mde77tryesutqc4y7eq2pfkr2gezmqlp5w", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/rg/crggdtu4kcao75se52mde77tryesutqc4y7eq2pfkr2gezmqlp5w.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "float", "Scalar"], "Input Strides": [[4096, 1], [4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096], [16, 4096, 1024], [32000, 1024], []], "Ev Idx": 4528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_2", "pid": 4183441, "tid": 31362, + "ts": 676008333912.279, "dur": 20.615, + "args": { + "External id": 450994,"kernel_hash": "cax2yoq4h5h6n6iitjhflmelobmft3hhrwz5mgohpe6jv74eyand", "grid": "grid(32768000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "32768000"], "kernel_file": "/tmp/torchinductor_cvm/ax/cax2yoq4h5h6n6iitjhflmelobmft3hhrwz5mgohpe6jv74eyand.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 4529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008333969.762, "dur": 15.988, + "args": { + "External id": 450995,"Record function id": 0, "Ev Idx": 4530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 4183441, "tid": 31362, + "ts": 676008333973.471, "dur": 11.401, + "args": { + "External id": 450996,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 31362, + "ts": 676008333977.254, "dur": 6.797, + "args": { + "External id": 450997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 31362, + "ts": 676008333978.748, "dur": 5.203, + "args": { + "External id": 450998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 4533 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::root_post_backward_callback", "pid": 4183441, "tid": 31362, + "ts": 676008334009.623, "dur": 6734.924, + "args": { + "External id": 450999,"Record function id": 0, "Ev Idx": 4534 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate", "pid": 4183441, "tid": 31362, + "ts": 676008334028.091, "dur": 38.255, + "args": { + "External id": 451000,"Record function id": 0, "Ev Idx": 4535 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard", "pid": 4183441, "tid": 31362, + "ts": 676008334072.555, "dur": 293.861, + "args": { + "External id": 451001,"Record function id": 0, "Ev Idx": 4536 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce", "pid": 4183441, "tid": 31362, + "ts": 676008334373.758, "dur": 6121.962, + "args": { + "External id": 451002,"Record function id": 0, "Ev Idx": 4537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008334491.853, "dur": 7.540, + "args": { + "External id": 451003,"Record function id": 0, "Concrete Inputs": ["[116925440]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 31362, + "ts": 676008334509.816, "dur": 5.254, + "args": { + "External id": 451004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[116925440], []], "Ev Idx": 4539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008334532.542, "dur": 4691.123, + "args": { + "External id": 451005,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [14615680, 1]], "Input Dims": [[], [], [], [8, 14615680]], "Ev Idx": 4540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 4183441, "tid": 31362, + "ts": 676008334552.869, "dur": 4660.124, + "args": { + "External id": 451006,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [14615680, 1]], "Input Dims": [[], [], [], [8, 14615680]], "Ev Idx": 4541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008334687.446, "dur": 13.920, + "args": { + "External id": 451007,"Record function id": 0, "Concrete Inputs": ["[28789]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 31362, + "ts": 676008334734.278, "dur": 4440.023, + "args": { + "External id": 451008,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[28789], [], [], [], [], [], [], []], "Ev Idx": 4543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 31362, + "ts": 676008334737.791, "dur": 4435.886, + "args": { + "External id": 451009,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[28789], [], [], [], [], [], []], "Ev Idx": 4544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 31362, + "ts": 676008334741.545, "dur": 7.188, + "args": { + "External id": 451010,"Record function id": 0, "Concrete Inputs": ["[28789]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 31362, + "ts": 676008334750.267, "dur": 4419.898, + "args": { + "External id": 451011,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[28789], [28789], []], "Ev Idx": 4546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 31362, + "ts": 676008339339.993, "dur": 9.172, + "args": { + "External id": 451012,"Record function id": 0, "Concrete Inputs": ["", "[14615680]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[116925440], [], [], [], [], []], "Ev Idx": 4547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 31362, + "ts": 676008339342.889, "dur": 5.920, + "args": { + "External id": 451013,"Record function id": 0, "Concrete Inputs": ["[14615680]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 4183441, "tid": 31362, + "ts": 676008339377.444, "dur": 465.861, + "args": { + "External id": 451014,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[14615680], [116925440], [], [], [], []], "Ev Idx": 4549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008339401.695, "dur": 436.197, + "args": { + "External id": 451015,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 14615680, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[116925440], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4550, "In msg nelems": 116925440 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 4183441, "tid": 31362, + "ts": 676008339412.752, "dur": 419.693, + "args": { + "External id": 451016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[116925440]], "Ev Idx": 4551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 31362, + "ts": 676008339866.743, "dur": 2.231, + "args": { + "External id": 451017,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4552, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008339927.492, "dur": 6.653, + "args": { + "External id": 451018,"Record function id": 0, "Concrete Inputs": ["", "[4000, 1024]", "[1024, 1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008339976.243, "dur": 1.476, + "args": { + "External id": 451019,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4096000"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008339993.002, "dur": 1.460, + "args": { + "External id": 451020,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4096128"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340006.233, "dur": 1.231, + "args": { + "External id": 451021,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4227200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340017.963, "dur": 1.439, + "args": { + "External id": 451022,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4358272"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340029.299, "dur": 1.507, + "args": { + "External id": 451023,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "4489344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340040.368, "dur": 1.465, + "args": { + "External id": 451024,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4620416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340052.058, "dur": 1.158, + "args": { + "External id": 451025,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "4620544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340063.944, "dur": 1.487, + "args": { + "External id": 451026,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "4980992"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340075.533, "dur": 1.317, + "args": { + "External id": 451027,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "5341440"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340106.181, "dur": 2.180, + "args": { + "External id": 451028,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "5701888"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340119.595, "dur": 1.881, + "args": { + "External id": 451029,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5702016"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340131.308, "dur": 1.353, + "args": { + "External id": 451030,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5833088"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340142.185, "dur": 1.152, + "args": { + "External id": 451031,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "5964160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340152.440, "dur": 1.565, + "args": { + "External id": 451032,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "6095232"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340163.814, "dur": 1.672, + "args": { + "External id": 451033,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "6226304"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340175.659, "dur": 1.439, + "args": { + "External id": 451034,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "6226432"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340187.373, "dur": 1.545, + "args": { + "External id": 451035,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "6586880"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340199.465, "dur": 1.473, + "args": { + "External id": 451036,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "6947328"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340211.610, "dur": 1.194, + "args": { + "External id": 451037,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7307776"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340224.112, "dur": 1.313, + "args": { + "External id": 451038,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7307904"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340236.320, "dur": 1.567, + "args": { + "External id": 451039,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7438976"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340249.625, "dur": 0.979, + "args": { + "External id": 451040,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7570048"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340261.560, "dur": 1.621, + "args": { + "External id": 451041,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "7701120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340272.976, "dur": 1.146, + "args": { + "External id": 451042,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7832192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340284.921, "dur": 1.122, + "args": { + "External id": 451043,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "7832320"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340296.195, "dur": 1.551, + "args": { + "External id": 451044,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "8192768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340307.778, "dur": 1.315, + "args": { + "External id": 451045,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "8553216"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340319.625, "dur": 1.577, + "args": { + "External id": 451046,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8913664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340331.060, "dur": 1.511, + "args": { + "External id": 451047,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "8913792"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340343.041, "dur": 1.340, + "args": { + "External id": 451048,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9044864"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340354.533, "dur": 1.483, + "args": { + "External id": 451049,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9175936"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340366.279, "dur": 1.463, + "args": { + "External id": 451050,"Record function id": 0, "Concrete Inputs": ["", "[128, 1024]", "[1024, 1]", "9307008"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340377.380, "dur": 1.290, + "args": { + "External id": 451051,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9438080"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340388.606, "dur": 1.302, + "args": { + "External id": 451052,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "9438208"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340399.656, "dur": 1.283, + "args": { + "External id": 451053,"Record function id": 0, "Concrete Inputs": ["", "[352, 1024]", "[1024, 1]", "9798656"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340411.017, "dur": 1.265, + "args": { + "External id": 451054,"Record function id": 0, "Concrete Inputs": ["", "[128, 2816]", "[2816, 1]", "10159104"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340422.168, "dur": 1.502, + "args": { + "External id": 451055,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10519552"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 31362, + "ts": 676008340434.379, "dur": 1.393, + "args": { + "External id": 451056,"Record function id": 0, "Concrete Inputs": ["", "[4000, 1024]", "[1024, 1]", "10519680"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4591 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "ProfilerStep#23551", "pid": 4183441, "tid": 4183441, + "ts": 676007567806.807, "dur": 788183.512, + "args": { + "External id": 442369,"Record function id": 0, "Ev Idx": 4592 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.zero_grad#AdamW.zero_grad", "pid": 4183441, "tid": 4183441, + "ts": 676007567840.422, "dur": 491.844, + "args": { + "External id": 442370,"Record function id": 0, "Ev Idx": 4593 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "enumerate(DataLoader)#_StatefulMultiProcessingDataLoaderIter.__next__", "pid": 4183441, "tid": 4183441, + "ts": 676007568373.907, "dur": 2113.492, + "args": { + "External id": 442371,"Record function id": 0, "Ev Idx": 4594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007569503.277, "dur": 8.437, + "args": { + "External id": 442372,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183441, "tid": 4183441, + "ts": 676007569531.987, "dur": 6.807, + "args": { + "External id": 442373,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007569976.306, "dur": 2.266, + "args": { + "External id": 442374,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183441, "tid": 4183441, + "ts": 676007569987.140, "dur": 2.731, + "args": { + "External id": 442375,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007570365.621, "dur": 1.798, + "args": { + "External id": 442376,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 4183441, "tid": 4183441, + "ts": 676007570374.443, "dur": 1.935, + "args": { + "External id": 442377,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 4600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007570918.727, "dur": 14.136, + "args": { + "External id": 442378,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 4601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007570926.516, "dur": 2.568, + "args": { + "External id": 442379,"Record function id": 0, "Concrete Inputs": ["", "[16, 8192]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 4602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007570934.508, "dur": 4.597, + "args": { + "External id": 442380,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 4603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007570936.944, "dur": 1.143, + "args": { + "External id": 442381,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 4604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007570966.768, "dur": 521.607, + "args": { + "External id": 442382,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], [], []], "Ev Idx": 4605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007570974.501, "dur": 512.830, + "args": { + "External id": 442383,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 4606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007570983.752, "dur": 9.656, + "args": { + "External id": 442384,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007570995.961, "dur": 489.893, + "args": { + "External id": 442385,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007571005.755, "dur": 0.470, + "args": { + "External id": 442386,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 4609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 4183441, "tid": 4183441, + "ts": 676007571008.697, "dur": 8.914, + "args": { + "External id": 442387,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[8192, 1], [4096, 1]], "Input Dims": [[16, 4096], [16, 4096]], "Ev Idx": 4610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183441, "tid": 4183441, + "ts": 676007571013.598, "dur": 3.730, + "args": { + "External id": 442388,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], []], "Input Dims": [[16, 4096], [], []], "Ev Idx": 4611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007571016.295, "dur": 0.669, + "args": { + "External id": 442389,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007571019.813, "dur": 201.012, + "args": { + "External id": 442390,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 4613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007571022.427, "dur": 198.067, + "args": { + "External id": 442391,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 4614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007571025.030, "dur": 14.296, + "args": { + "External id": 442392,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 4615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007571027.258, "dur": 11.544, + "args": { + "External id": 442393,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007571040.194, "dur": 179.225, + "args": { + "External id": 442394,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007571223.661, "dur": 258.741, + "args": { + "External id": 442395,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007571505.792, "dur": 681.365, + "args": { + "External id": 442396,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 4619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007571507.697, "dur": 678.594, + "args": { + "External id": 442397,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], []], "Ev Idx": 4620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007571515.252, "dur": 7.604, + "args": { + "External id": 442398,"Record function id": 0, "Concrete Inputs": ["[16, 8192]", "[8192, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007571523.804, "dur": 654.759, + "args": { + "External id": 442399,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[8192, 1], [8192, 1], []], "Input Dims": [[16, 8192], [16, 8192], []], "Ev Idx": 4622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 4183441, "tid": 4183441, + "ts": 676007572234.252, "dur": 77.017, + "args": { + "External id": 442400,"Record function id": 0, "Concrete Inputs": ["0", "4096", "", "", "", "False"], "Input type": ["Scalar", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007572240.867, "dur": 7.756, + "args": { + "External id": 442401,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 4183441, "tid": 4183441, + "ts": 676007572252.238, "dur": 57.286, + "args": { + "External id": 442402,"Record function id": 0, "Concrete Inputs": ["0", "4096", "1", ""], "Input type": ["Scalar", "Scalar", "Scalar", "long int"], "Input Strides": [[], [], [], [1]], "Input Dims": [[], [], [], [0]], "Ev Idx": 4625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007572257.552, "dur": 7.353, + "args": { + "External id": 442403,"Record function id": 0, "Concrete Inputs": ["", "[4096]", ""], "Input type": ["long int", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 4626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::repeat", "pid": 4183441, "tid": 4183441, + "ts": 676007572339.670, "dur": 100.266, + "args": { + "External id": 442404,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4096], []], "Ev Idx": 4627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183441, "tid": 4183441, + "ts": 676007572344.630, "dur": 8.359, + "args": { + "External id": 442405,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[4096], [], []], "Ev Idx": 4628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007572349.981, "dur": 2.310, + "args": { + "External id": 442406,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "[4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[4096], [], [], []], "Ev Idx": 4629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007572354.182, "dur": 8.058, + "args": { + "External id": 442407,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 4183441, + "ts": 676007572366.874, "dur": 4.201, + "args": { + "External id": 442408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[4096, 1]], "Input Dims": [[16, 4096]], "Ev Idx": 4631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183441, "tid": 4183441, + "ts": 676007572373.819, "dur": 5.550, + "args": { + "External id": 442409,"Record function id": 0, "Concrete Inputs": ["", "0", "1", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007572378.510, "dur": 0.725, + "args": { + "External id": 442410,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1]", "[4096, 1, 4096]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 4633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183441, "tid": 4183441, + "ts": 676007572380.328, "dur": 17.396, + "args": { + "External id": 442411,"Record function id": 0, "Concrete Inputs": ["", "1", "4096", "4096"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 4634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007572384.825, "dur": 10.748, + "args": { + "External id": 442412,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[4096, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 4635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 4183441, "tid": 4183441, + "ts": 676007572401.565, "dur": 5.800, + "args": { + "External id": 442413,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[4096, 1], [4096, 4096, 4096, 1]], "Input Dims": [[1, 4096], [16, 1, 1, 4096]], "Ev Idx": 4636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 4183441, "tid": 4183441, + "ts": 676007572403.671, "dur": 3.583, + "args": { + "External id": 442414,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[4096, 1], [], []], "Input Dims": [[1, 4096], [], []], "Ev Idx": 4637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007572405.535, "dur": 1.563, + "args": { + "External id": 442415,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[0, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[1, 4096], [], [], []], "Ev Idx": 4638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007572408.567, "dur": 30.590, + "args": { + "External id": 442416,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 4096, 4096, 1], [0, 4096, 4096, 1], []], "Input Dims": [[16, 1, 1, 4096], [16, 1, 1, 4096], []], "Ev Idx": 4639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007572451.785, "dur": 72.952, + "args": { + "External id": 442417,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 4640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007572453.272, "dur": 71.148, + "args": { + "External id": 442418,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "", "", "", "False", ""], "Input type": ["long int", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 4641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007572474.703, "dur": 7.390, + "args": { + "External id": 442419,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "3", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007572483.790, "dur": 38.551, + "args": { + "External id": 442420,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 4643 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::root_pre_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007572644.797, "dur": 192.078, + "args": { + "External id": 442421,"Record function id": 0, "Ev Idx": 4644 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::inputs_to_device", "pid": 4183441, "tid": 4183441, + "ts": 676007572769.141, "dur": 57.975, + "args": { + "External id": 442422,"Record function id": 0, "Ev Idx": 4645 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007572843.796, "dur": 43.255, + "args": { + "External id": 442423,"Record function id": 0, "Ev Idx": 4646 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007572895.833, "dur": 7099.612, + "args": { + "External id": 442424,"Record function id": 0, "Ev Idx": 4647 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather", "pid": 4183441, "tid": 4183441, + "ts": 676007572905.135, "dur": 1327.346, + "args": { + "External id": 442425,"Record function id": 0, "Ev Idx": 4648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007573030.119, "dur": 7.414, + "args": { + "External id": 442426,"Record function id": 0, "Concrete Inputs": ["[14615680]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007573054.592, "dur": 157.861, + "args": { + "External id": 442427,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[14615680], [], []], "Ev Idx": 4650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573059.098, "dur": 1.707, + "args": { + "External id": 442428,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573067.293, "dur": 0.476, + "args": { + "External id": 442429,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4096000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573068.627, "dur": 0.712, + "args": { + "External id": 442430,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4096128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573070.008, "dur": 2.688, + "args": { + "External id": 442431,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4227200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573077.828, "dur": 0.477, + "args": { + "External id": 442432,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4358272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573079.045, "dur": 0.634, + "args": { + "External id": 442433,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "4489344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573080.297, "dur": 15.994, + "args": { + "External id": 442434,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "4620416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573100.623, "dur": 0.367, + "args": { + "External id": 442435,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "4620544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573101.691, "dur": 0.444, + "args": { + "External id": 442436,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "4980992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573107.777, "dur": 0.368, + "args": { + "External id": 442437,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "5341440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573108.738, "dur": 0.379, + "args": { + "External id": 442438,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "5701888"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573110.030, "dur": 2.053, + "args": { + "External id": 442439,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5702016"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573117.510, "dur": 0.426, + "args": { + "External id": 442440,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5833088"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573118.571, "dur": 0.513, + "args": { + "External id": 442441,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "5964160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573119.844, "dur": 2.805, + "args": { + "External id": 442442,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "6095232"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573125.071, "dur": 0.336, + "args": { + "External id": 442443,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "6226304"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573126.228, "dur": 0.409, + "args": { + "External id": 442444,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6226432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573132.026, "dur": 0.316, + "args": { + "External id": 442445,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6586880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573133.065, "dur": 0.729, + "args": { + "External id": 442446,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "6947328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573134.431, "dur": 2.449, + "args": { + "External id": 442447,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7307776"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573142.120, "dur": 0.491, + "args": { + "External id": 442448,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7307904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573143.086, "dur": 0.834, + "args": { + "External id": 442449,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7438976"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573144.818, "dur": 2.917, + "args": { + "External id": 442450,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7570048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573150.402, "dur": 0.368, + "args": { + "External id": 442451,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "7701120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573151.532, "dur": 0.314, + "args": { + "External id": 442452,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "7832192"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573157.381, "dur": 0.261, + "args": { + "External id": 442453,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "7832320"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573158.361, "dur": 0.353, + "args": { + "External id": 442454,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8192768"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573159.405, "dur": 2.364, + "args": { + "External id": 442455,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573164.900, "dur": 0.234, + "args": { + "External id": 442456,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8913664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573165.940, "dur": 0.374, + "args": { + "External id": 442457,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8913792"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573166.880, "dur": 2.598, + "args": { + "External id": 442458,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9044864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573172.600, "dur": 0.565, + "args": { + "External id": 442459,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9175936"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573173.705, "dur": 0.352, + "args": { + "External id": 442460,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "9307008"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573179.555, "dur": 0.556, + "args": { + "External id": 442461,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "9438080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573180.694, "dur": 0.861, + "args": { + "External id": 442462,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9438208"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573182.274, "dur": 2.100, + "args": { + "External id": 442463,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9798656"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573187.706, "dur": 0.313, + "args": { + "External id": 442464,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "10159104"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573188.949, "dur": 0.402, + "args": { + "External id": 442465,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "10519552"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573189.956, "dur": 2.018, + "args": { + "External id": 442466,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "10519680"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007573241.991, "dur": 49.925, + "args": { + "External id": 442467,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 4690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007573376.654, "dur": 255.740, + "args": { + "External id": 442468,"Record function id": 0, "Concrete Inputs": ["", "", "14615680", "8", "5", "15", ""], "Input type": ["TensorList", "", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 4691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007573396.258, "dur": 5.494, + "args": { + "External id": 442469,"Record function id": 0, "Concrete Inputs": ["[116925440]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007573408.435, "dur": 13.424, + "args": { + "External id": 442470,"Record function id": 0, "Concrete Inputs": ["", "0", "73078400", "14615680"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[116925440], [], [], []], "Ev Idx": 4693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007573413.360, "dur": 8.081, + "args": { + "External id": 442471,"Record function id": 0, "Concrete Inputs": ["", "0", "73078400", "87694080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[116925440], [], [], [], []], "Ev Idx": 4694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573418.360, "dur": 0.812, + "args": { + "External id": 442472,"Record function id": 0, "Concrete Inputs": ["", "[14615680]", "[1]", "73078400"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[116925440], [], [], []], "Ev Idx": 4695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007573430.228, "dur": 126.939, + "args": { + "External id": 442473,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[14615680], [], []], "Ev Idx": 4696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573431.847, "dur": 0.636, + "args": { + "External id": 442474,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "73078400"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573433.616, "dur": 0.446, + "args": { + "External id": 442475,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "77174400"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573437.216, "dur": 2.465, + "args": { + "External id": 442476,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "77174528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573440.523, "dur": 0.915, + "args": { + "External id": 442477,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "77305600"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573443.921, "dur": 0.557, + "args": { + "External id": 442478,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "77436672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573445.142, "dur": 0.424, + "args": { + "External id": 442479,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "77567744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573446.616, "dur": 0.551, + "args": { + "External id": 442480,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "77698816"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573449.765, "dur": 0.330, + "args": { + "External id": 442481,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "77698944"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573450.957, "dur": 0.976, + "args": { + "External id": 442482,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "78059392"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573452.552, "dur": 0.630, + "args": { + "External id": 442483,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "78419840"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573456.251, "dur": 2.006, + "args": { + "External id": 442484,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "78780288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573459.284, "dur": 0.380, + "args": { + "External id": 442485,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "78780416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573462.409, "dur": 2.371, + "args": { + "External id": 442486,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "78911488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573465.675, "dur": 0.396, + "args": { + "External id": 442487,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "79042560"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573466.643, "dur": 0.486, + "args": { + "External id": 442488,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "79173632"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573472.439, "dur": 0.162, + "args": { + "External id": 442489,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "79304704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573473.204, "dur": 0.696, + "args": { + "External id": 442490,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "79304832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573474.543, "dur": 0.274, + "args": { + "External id": 442491,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "79665280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573480.023, "dur": 1.589, + "args": { + "External id": 442492,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "80025728"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573482.213, "dur": 0.367, + "args": { + "External id": 442493,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "80386176"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573485.543, "dur": 2.359, + "args": { + "External id": 442494,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "80386304"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573488.747, "dur": 0.772, + "args": { + "External id": 442495,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "80517376"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573490.131, "dur": 0.513, + "args": { + "External id": 442496,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "80648448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573496.413, "dur": 0.377, + "args": { + "External id": 442497,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "80779520"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573497.348, "dur": 0.352, + "args": { + "External id": 442498,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "80910592"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573498.355, "dur": 0.536, + "args": { + "External id": 442499,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "80910720"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573503.749, "dur": 1.686, + "args": { + "External id": 442500,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "81271168"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573506.224, "dur": 0.394, + "args": { + "External id": 442501,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "81631616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573508.981, "dur": 2.053, + "args": { + "External id": 442502,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "81992064"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573511.805, "dur": 0.421, + "args": { + "External id": 442503,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "81992192"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573512.808, "dur": 0.462, + "args": { + "External id": 442504,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "82123264"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573519.057, "dur": 0.568, + "args": { + "External id": 442505,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "82254336"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573520.161, "dur": 0.621, + "args": { + "External id": 442506,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "82385408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573522.221, "dur": 0.322, + "args": { + "External id": 442507,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "82516480"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573527.661, "dur": 2.129, + "args": { + "External id": 442508,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "82516608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573530.422, "dur": 0.266, + "args": { + "External id": 442509,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "82877056"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573533.751, "dur": 2.513, + "args": { + "External id": 442510,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "83237504"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573537.213, "dur": 0.683, + "args": { + "External id": 442511,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "83597952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007573538.592, "dur": 0.828, + "args": { + "External id": 442512,"Record function id": 0, "Concrete Inputs": ["", "[4096000]", "[1]", "83598080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[14615680], [], [], []], "Ev Idx": 4735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007573580.937, "dur": 34.532, + "args": { + "External id": 442513,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 4736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007573731.667, "dur": 378.970, + "args": { + "External id": 442514,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[116925440], [14615680], [], [], []], "Ev Idx": 4737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007573765.976, "dur": 338.730, + "args": { + "External id": 442515,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 116925440, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[14615680], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4738, "In msg nelems": 14615680 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007573777.025, "dur": 320.390, + "args": { + "External id": 442516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[14615680]], "Ev Idx": 4739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007574138.121, "dur": 2.995, + "args": { + "External id": 442517,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4740, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out", "pid": 4183441, "tid": 4183441, + "ts": 676007574249.810, "dur": 5538.991, + "args": { + "External id": 442518,"Record function id": 0, "Ev Idx": 4741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574475.595, "dur": 6.986, + "args": { + "External id": 442519,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[116925440], []], "Ev Idx": 4742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574486.634, "dur": 1.463, + "args": { + "External id": 442520,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[32768000], []], "Ev Idx": 4743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574489.792, "dur": 1.059, + "args": { + "External id": 442521,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574492.470, "dur": 2.593, + "args": { + "External id": 442522,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574498.475, "dur": 1.215, + "args": { + "External id": 442523,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574501.478, "dur": 0.907, + "args": { + "External id": 442524,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574503.921, "dur": 1.027, + "args": { + "External id": 442525,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574506.230, "dur": 1.998, + "args": { + "External id": 442526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574514.405, "dur": 0.852, + "args": { + "External id": 442527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574516.509, "dur": 1.123, + "args": { + "External id": 442528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574519.010, "dur": 1.119, + "args": { + "External id": 442529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574521.648, "dur": 2.701, + "args": { + "External id": 442530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574527.539, "dur": 0.856, + "args": { + "External id": 442531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574530.112, "dur": 1.149, + "args": { + "External id": 442532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574532.547, "dur": 1.138, + "args": { + "External id": 442533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574534.892, "dur": 2.859, + "args": { + "External id": 442534,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574543.232, "dur": 0.983, + "args": { + "External id": 442535,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574545.485, "dur": 0.667, + "args": { + "External id": 442536,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574547.881, "dur": 1.042, + "args": { + "External id": 442537,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574550.174, "dur": 2.742, + "args": { + "External id": 442538,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574556.526, "dur": 0.811, + "args": { + "External id": 442539,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574558.620, "dur": 0.714, + "args": { + "External id": 442540,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574560.882, "dur": 0.738, + "args": { + "External id": 442541,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574563.180, "dur": 1.873, + "args": { + "External id": 442542,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574584.261, "dur": 0.706, + "args": { + "External id": 442543,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574586.223, "dur": 1.042, + "args": { + "External id": 442544,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574588.840, "dur": 0.714, + "args": { + "External id": 442545,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574591.106, "dur": 2.529, + "args": { + "External id": 442546,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574597.736, "dur": 0.859, + "args": { + "External id": 442547,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574599.800, "dur": 0.867, + "args": { + "External id": 442548,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574602.163, "dur": 0.995, + "args": { + "External id": 442549,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574604.769, "dur": 2.144, + "args": { + "External id": 442550,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574613.184, "dur": 1.337, + "args": { + "External id": 442551,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574615.788, "dur": 1.433, + "args": { + "External id": 442552,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574618.879, "dur": 0.866, + "args": { + "External id": 442553,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574621.019, "dur": 2.553, + "args": { + "External id": 442554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574627.112, "dur": 0.571, + "args": { + "External id": 442555,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574629.011, "dur": 1.340, + "args": { + "External id": 442556,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574631.734, "dur": 0.909, + "args": { + "External id": 442557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007574633.889, "dur": 2.385, + "args": { + "External id": 442558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[32768000], []], "Ev Idx": 4781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007574705.217, "dur": 5025.603, + "args": { + "External id": 442559,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[14615680, 1], [], [], []], "Input Dims": [[8, 14615680], [], [], []], "Ev Idx": 4782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007574732.195, "dur": 4989.118, + "args": { + "External id": 442560,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[14615680, 1], [], [], []], "Input Dims": [[8, 14615680], [], [], []], "Ev Idx": 4783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007574752.735, "dur": 6.240, + "args": { + "External id": 442561,"Record function id": 0, "Concrete Inputs": ["[3034]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007574763.972, "dur": 4916.534, + "args": { + "External id": 442562,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[3034], [], [], [], [], [], [], []], "Ev Idx": 4785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007574766.710, "dur": 4885.982, + "args": { + "External id": 442563,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[3034], [], [], [], [], [], []], "Ev Idx": 4786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007574774.159, "dur": 6.961, + "args": { + "External id": 442564,"Record function id": 0, "Concrete Inputs": ["[3034]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007574782.727, "dur": 4866.576, + "args": { + "External id": 442565,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[3034], [3034], []], "Ev Idx": 4788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007580093.792, "dur": 40.760, + "args": { + "External id": 442566,"Record function id": 0, "Ev Idx": 4789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 0/0", "pid": 4183441, "tid": 4183441, + "ts": 676007580136.930, "dur": 224.557, + "args": { + "External id": 442567,"Record function id": 0, "Ev Idx": 4790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007580181.074, "dur": 171.172, + "args": { + "External id": 442568,"Sequence number": 5285388, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "long int"], "Input Strides": [[1024, 1], [4096, 1]], "Input Dims": [[32000, 1024], [16, 4096]], "Ev Idx": 4791 + } + }, + { + "ph": "s", "id": 212, "pid": 4183441, "tid": 4183441, "ts": 676007580181.074, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_0", "pid": 4183441, "tid": 4183441, + "ts": 676007580261.275, "dur": 49.909, + "args": { + "External id": 442569,"kernel_hash": "chibah4fn4h2t2uavsaujvzp4is3c5kamcj5b6bik3gl2uvrmaxd", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/hi/chibah4fn4h2t2uavsaujvzp4is3c5kamcj5b6bik3gl2uvrmaxd.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], [1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096], [32000, 1024], [16, 4096, 1024], []], "Ev Idx": 4792 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007580424.069, "dur": 57.890, + "args": { + "External id": 442570,"Record function id": 0, "Ev Idx": 4793 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.0)", "pid": 4183441, "tid": 4183441, + "ts": 676007580492.699, "dur": 6696.546, + "args": { + "External id": 442571,"Record function id": 0, "Ev Idx": 4794 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 4183441, "tid": 4183441, + "ts": 676007580501.092, "dur": 887.457, + "args": { + "External id": 442572,"Record function id": 0, "Ev Idx": 4795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007580578.444, "dur": 11.410, + "args": { + "External id": 442573,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007580603.563, "dur": 46.108, + "args": { + "External id": 442574,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580614.164, "dur": 2.494, + "args": { + "External id": 442575,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580618.417, "dur": 0.467, + "args": { + "External id": 442576,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580619.691, "dur": 2.813, + "args": { + "External id": 442577,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580625.061, "dur": 0.454, + "args": { + "External id": 442578,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580626.272, "dur": 0.365, + "args": { + "External id": 442579,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580629.561, "dur": 0.360, + "args": { + "External id": 442580,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580632.574, "dur": 0.268, + "args": { + "External id": 442581,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580633.637, "dur": 2.299, + "args": { + "External id": 442582,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580640.993, "dur": 0.465, + "args": { + "External id": 442583,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007580698.400, "dur": 40.612, + "args": { + "External id": 442584,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007580774.385, "dur": 125.037, + "args": { + "External id": 442585,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007580786.430, "dur": 6.659, + "args": { + "External id": 442586,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007580799.276, "dur": 12.440, + "args": { + "External id": 442587,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007580803.667, "dur": 7.657, + "args": { + "External id": 442588,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580808.951, "dur": 0.721, + "args": { + "External id": 442589,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007580818.774, "dur": 33.425, + "args": { + "External id": 442590,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580820.301, "dur": 0.820, + "args": { + "External id": 442591,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580824.041, "dur": 0.933, + "args": { + "External id": 442592,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580827.679, "dur": 0.761, + "args": { + "External id": 442593,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580829.158, "dur": 0.650, + "args": { + "External id": 442594,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580832.841, "dur": 3.852, + "args": { + "External id": 442595,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580837.356, "dur": 0.309, + "args": { + "External id": 442596,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580840.993, "dur": 0.543, + "args": { + "External id": 442597,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580844.503, "dur": 0.761, + "args": { + "External id": 442598,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007580846.058, "dur": 0.400, + "args": { + "External id": 442599,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007580866.176, "dur": 24.637, + "args": { + "External id": 442600,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007580949.404, "dur": 341.246, + "args": { + "External id": 442601,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007580978.630, "dur": 306.383, + "args": { + "External id": 442602,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4825, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007580991.310, "dur": 288.023, + "args": { + "External id": 442603,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007581318.248, "dur": 2.713, + "args": { + "External id": 442604,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4827, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 4183441, "tid": 4183441, + "ts": 676007581409.535, "dur": 5548.880, + "args": { + "External id": 442605,"Record function id": 0, "Ev Idx": 4828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581516.301, "dur": 6.353, + "args": { + "External id": 442606,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581526.095, "dur": 1.424, + "args": { + "External id": 442607,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581529.069, "dur": 1.188, + "args": { + "External id": 442608,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581532.231, "dur": 3.366, + "args": { + "External id": 442609,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581536.973, "dur": 1.277, + "args": { + "External id": 442610,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581541.759, "dur": 0.998, + "args": { + "External id": 442611,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581544.179, "dur": 0.848, + "args": { + "External id": 442612,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581546.753, "dur": 2.725, + "args": { + "External id": 442613,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581553.426, "dur": 0.857, + "args": { + "External id": 442614,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007581558.078, "dur": 0.867, + "args": { + "External id": 442615,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007581575.179, "dur": 5344.965, + "args": { + "External id": 442616,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007581592.520, "dur": 5320.810, + "args": { + "External id": 442617,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007581613.759, "dur": 14.165, + "args": { + "External id": 442618,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007581630.936, "dur": 5251.220, + "args": { + "External id": 442619,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007581633.321, "dur": 5248.378, + "args": { + "External id": 442620,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007581639.912, "dur": 7.398, + "args": { + "External id": 442621,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007581648.916, "dur": 5229.419, + "args": { + "External id": 442622,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007587130.708, "dur": 32.485, + "args": { + "External id": 442623,"Sequence number": 5285389, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4846 + } + }, + { + "ph": "s", "id": 211, "pid": 4183441, "tid": 4183441, "ts": 676007587130.708, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007587147.472, "dur": 10.777, + "args": { + "External id": 442624,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 4847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007587153.280, "dur": 4.593, + "args": { + "External id": 442625,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 4848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007587230.682, "dur": 103.202, + "args": { + "External id": 442626,"Record function id": 0, "Ev Idx": 4849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007587335.333, "dur": 1188.871, + "args": { + "External id": 442627,"Record function id": 0, "Ev Idx": 4850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007587377.191, "dur": 1132.287, + "args": { + "External id": 442628,"Sequence number": 5285390, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 4851 + } + }, + { + "ph": "s", "id": 210, "pid": 4183441, "tid": 4183441, "ts": 676007587377.191, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007587443.839, "dur": 43.569, + "args": { + "External id": 442629,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007587500.229, "dur": 93.239, + "args": { + "External id": 442630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007587605.253, "dur": 34.370, + "args": { + "External id": 442631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007587650.434, "dur": 95.238, + "args": { + "External id": 442632,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007587776.641, "dur": 28.748, + "args": { + "External id": 442633,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007587824.864, "dur": 16.554, + "args": { + "External id": 442634,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007587862.316, "dur": 133.180, + "args": { + "External id": 442635,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 4858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007587916.227, "dur": 12.047, + "args": { + "External id": 442636,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 4859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007587921.158, "dur": 6.276, + "args": { + "External id": 442637,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007587930.574, "dur": 3.527, + "args": { + "External id": 442638,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007587937.869, "dur": 1.193, + "args": { + "External id": 442639,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007587941.408, "dur": 2.681, + "args": { + "External id": 442640,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007588006.408, "dur": 48.360, + "args": { + "External id": 442641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007588124.852, "dur": 31.942, + "args": { + "External id": 442642,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007588166.339, "dur": 58.370, + "args": { + "External id": 442643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007588233.659, "dur": 49.199, + "args": { + "External id": 442644,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007588308.289, "dur": 26.990, + "args": { + "External id": 442645,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 4868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007588341.235, "dur": 32.980, + "args": { + "External id": 442646,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007588398.919, "dur": 20.447, + "args": { + "External id": 442647,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 4870 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.0)", "pid": 4183441, "tid": 4183441, + "ts": 676007588592.141, "dur": 164.491, + "args": { + "External id": 442648,"Record function id": 0, "Ev Idx": 4871 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007588840.269, "dur": 48.307, + "args": { + "External id": 442649,"Record function id": 0, "Ev Idx": 4872 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.1)", "pid": 4183441, "tid": 4183441, + "ts": 676007588897.877, "dur": 10692.630, + "args": { + "External id": 442650,"Record function id": 0, "Ev Idx": 4873 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 4183441, "tid": 4183441, + "ts": 676007588908.811, "dur": 1016.582, + "args": { + "External id": 442651,"Record function id": 0, "Ev Idx": 4874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007588995.321, "dur": 9.017, + "args": { + "External id": 442652,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007589018.297, "dur": 46.364, + "args": { + "External id": 442653,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589025.762, "dur": 3.967, + "args": { + "External id": 442654,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589031.503, "dur": 0.647, + "args": { + "External id": 442655,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589032.914, "dur": 0.422, + "args": { + "External id": 442656,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589039.261, "dur": 0.729, + "args": { + "External id": 442657,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589041.022, "dur": 2.253, + "args": { + "External id": 442658,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589046.063, "dur": 0.355, + "args": { + "External id": 442659,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589049.388, "dur": 0.360, + "args": { + "External id": 442660,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589050.479, "dur": 0.473, + "args": { + "External id": 442661,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589054.484, "dur": 2.570, + "args": { + "External id": 442662,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007589075.582, "dur": 80.638, + "args": { + "External id": 442663,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007589195.906, "dur": 133.038, + "args": { + "External id": 442664,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007589206.719, "dur": 5.052, + "args": { + "External id": 442665,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007589217.749, "dur": 12.863, + "args": { + "External id": 442666,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007589222.577, "dur": 7.614, + "args": { + "External id": 442667,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589227.802, "dur": 0.637, + "args": { + "External id": 442668,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007589237.961, "dur": 36.036, + "args": { + "External id": 442669,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589239.543, "dur": 0.488, + "args": { + "External id": 442670,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589243.576, "dur": 2.389, + "args": { + "External id": 442671,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589246.693, "dur": 3.127, + "args": { + "External id": 442672,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589253.607, "dur": 0.482, + "args": { + "External id": 442673,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589254.915, "dur": 0.513, + "args": { + "External id": 442674,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589258.373, "dur": 0.384, + "args": { + "External id": 442675,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589262.143, "dur": 0.554, + "args": { + "External id": 442676,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589263.570, "dur": 0.465, + "args": { + "External id": 442677,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007589267.209, "dur": 0.572, + "args": { + "External id": 442678,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007589290.664, "dur": 27.135, + "args": { + "External id": 442679,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007589385.468, "dur": 439.262, + "args": { + "External id": 442680,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007589417.857, "dur": 401.174, + "args": { + "External id": 442681,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4904, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007589429.208, "dur": 383.138, + "args": { + "External id": 442682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007589849.350, "dur": 2.482, + "args": { + "External id": 442683,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4906, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 4183441, "tid": 4183441, + "ts": 676007589946.663, "dur": 9435.434, + "args": { + "External id": 442684,"Record function id": 0, "Ev Idx": 4907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590049.129, "dur": 6.467, + "args": { + "External id": 442685,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590058.889, "dur": 1.723, + "args": { + "External id": 442686,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590062.360, "dur": 1.069, + "args": { + "External id": 442687,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590065.030, "dur": 1.476, + "args": { + "External id": 442688,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590068.159, "dur": 1.231, + "args": { + "External id": 442689,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590072.676, "dur": 1.044, + "args": { + "External id": 442690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590075.398, "dur": 1.498, + "args": { + "External id": 442691,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590080.533, "dur": 29.874, + "args": { + "External id": 442692,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590114.485, "dur": 1.027, + "args": { + "External id": 442693,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007590119.155, "dur": 1.085, + "args": { + "External id": 442694,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007590139.280, "dur": 9201.091, + "args": { + "External id": 442695,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007590156.279, "dur": 9177.032, + "args": { + "External id": 442696,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007590185.331, "dur": 13.935, + "args": { + "External id": 442697,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007590202.191, "dur": 9096.696, + "args": { + "External id": 442698,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 4921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007590204.765, "dur": 9093.381, + "args": { + "External id": 442699,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 4922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007590211.068, "dur": 5.117, + "args": { + "External id": 442700,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007590217.966, "dur": 9077.187, + "args": { + "External id": 442701,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 4924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007599534.283, "dur": 30.279, + "args": { + "External id": 442702,"Sequence number": 5285391, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 4925 + } + }, + { + "ph": "s", "id": 209, "pid": 4183441, "tid": 4183441, "ts": 676007599534.283, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007599550.312, "dur": 9.579, + "args": { + "External id": 442703,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 4926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007599555.661, "dur": 4.031, + "args": { + "External id": 442704,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 4927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007599632.824, "dur": 143.579, + "args": { + "External id": 442705,"Record function id": 0, "Ev Idx": 4928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007599779.271, "dur": 1155.993, + "args": { + "External id": 442706,"Record function id": 0, "Ev Idx": 4929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007599821.720, "dur": 1099.138, + "args": { + "External id": 442707,"Sequence number": 5285392, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 4930 + } + }, + { + "ph": "s", "id": 208, "pid": 4183441, "tid": 4183441, "ts": 676007599821.720, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007599912.131, "dur": 44.383, + "args": { + "External id": 442708,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007599972.564, "dur": 94.723, + "args": { + "External id": 442709,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600075.745, "dur": 73.916, + "args": { + "External id": 442710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600159.195, "dur": 30.787, + "args": { + "External id": 442711,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007600225.005, "dur": 27.448, + "args": { + "External id": 442712,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007600268.892, "dur": 18.068, + "args": { + "External id": 442713,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007600302.482, "dur": 135.887, + "args": { + "External id": 442714,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 4937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007600352.963, "dur": 15.086, + "args": { + "External id": 442715,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 4938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007600357.572, "dur": 9.695, + "args": { + "External id": 442716,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007600372.543, "dur": 4.183, + "args": { + "External id": 442717,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007600377.818, "dur": 3.017, + "args": { + "External id": 442718,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007600383.095, "dur": 2.630, + "args": { + "External id": 442719,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600449.378, "dur": 46.946, + "args": { + "External id": 442720,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 4943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007600528.810, "dur": 30.234, + "args": { + "External id": 442721,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 4944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600569.661, "dur": 37.880, + "args": { + "External id": 442722,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600614.132, "dur": 34.702, + "args": { + "External id": 442723,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 4946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007600729.889, "dur": 30.191, + "args": { + "External id": 442724,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 4947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007600767.011, "dur": 41.017, + "args": { + "External id": 442725,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 4948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007600827.409, "dur": 22.635, + "args": { + "External id": 442726,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 4949 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.1)", "pid": 4183441, "tid": 4183441, + "ts": 676007600999.566, "dur": 111.054, + "args": { + "External id": 442727,"Record function id": 0, "Ev Idx": 4950 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007601191.490, "dur": 47.250, + "args": { + "External id": 442728,"Record function id": 0, "Ev Idx": 4951 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.2)", "pid": 4183441, "tid": 4183441, + "ts": 676007601248.314, "dur": 9220.375, + "args": { + "External id": 442729,"Record function id": 0, "Ev Idx": 4952 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 4183441, "tid": 4183441, + "ts": 676007601260.844, "dur": 970.400, + "args": { + "External id": 442730,"Record function id": 0, "Ev Idx": 4953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007601345.910, "dur": 9.950, + "args": { + "External id": 442731,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007601368.918, "dur": 45.546, + "args": { + "External id": 442732,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601376.514, "dur": 2.424, + "args": { + "External id": 442733,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601382.948, "dur": 0.494, + "args": { + "External id": 442734,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601386.738, "dur": 0.576, + "args": { + "External id": 442735,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601387.969, "dur": 0.549, + "args": { + "External id": 442736,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601391.511, "dur": 0.536, + "args": { + "External id": 442737,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601395.116, "dur": 0.713, + "args": { + "External id": 442738,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601396.723, "dur": 4.305, + "args": { + "External id": 442739,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601401.756, "dur": 0.408, + "args": { + "External id": 442740,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601405.843, "dur": 0.292, + "args": { + "External id": 442741,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007601426.083, "dur": 43.720, + "args": { + "External id": 442742,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007601503.333, "dur": 115.652, + "args": { + "External id": 442743,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 4966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007601517.546, "dur": 3.548, + "args": { + "External id": 442744,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007601526.530, "dur": 9.874, + "args": { + "External id": 442745,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007601531.292, "dur": 4.718, + "args": { + "External id": 442746,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 4969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601534.198, "dur": 0.483, + "args": { + "External id": 442747,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 4970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007601542.498, "dur": 36.283, + "args": { + "External id": 442748,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 4971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601545.684, "dur": 2.988, + "args": { + "External id": 442749,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601549.643, "dur": 0.614, + "args": { + "External id": 442750,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601551.143, "dur": 0.563, + "args": { + "External id": 442751,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601557.264, "dur": 2.786, + "args": { + "External id": 442752,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601560.879, "dur": 0.510, + "args": { + "External id": 442753,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601562.116, "dur": 0.407, + "args": { + "External id": 442754,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601566.203, "dur": 0.402, + "args": { + "External id": 442755,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601567.190, "dur": 0.439, + "args": { + "External id": 442756,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007601570.560, "dur": 2.292, + "args": { + "External id": 442757,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 4980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007601588.728, "dur": 22.333, + "args": { + "External id": 442758,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 4981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007601724.158, "dur": 408.063, + "args": { + "External id": 442759,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 4982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007601760.241, "dur": 366.466, + "args": { + "External id": 442760,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4983, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007601771.692, "dur": 349.252, + "args": { + "External id": 442761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 4984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007602156.413, "dur": 2.623, + "args": { + "External id": 442762,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4985, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 4183441, "tid": 4183441, + "ts": 676007602251.316, "dur": 8019.089, + "args": { + "External id": 442763,"Record function id": 0, "Ev Idx": 4986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602354.371, "dur": 6.530, + "args": { + "External id": 442764,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 4987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602364.317, "dur": 1.594, + "args": { + "External id": 442765,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602367.418, "dur": 3.856, + "args": { + "External id": 442766,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602373.248, "dur": 1.067, + "args": { + "External id": 442767,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602375.625, "dur": 1.278, + "args": { + "External id": 442768,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602381.109, "dur": 1.219, + "args": { + "External id": 442769,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 4992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602385.586, "dur": 1.582, + "args": { + "External id": 442770,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 4993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602388.400, "dur": 2.189, + "args": { + "External id": 442771,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602391.733, "dur": 0.758, + "args": { + "External id": 442772,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007602395.679, "dur": 0.896, + "args": { + "External id": 442773,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 4996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007602412.996, "dur": 7820.814, + "args": { + "External id": 442774,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007602430.170, "dur": 7797.399, + "args": { + "External id": 442775,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 4998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007602447.286, "dur": 16.215, + "args": { + "External id": 442776,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007602466.865, "dur": 7725.198, + "args": { + "External id": 442777,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007602469.404, "dur": 7722.150, + "args": { + "External id": 442778,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007602475.348, "dur": 4.914, + "args": { + "External id": 442779,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007602481.920, "dur": 7706.242, + "args": { + "External id": 442780,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007610414.901, "dur": 30.439, + "args": { + "External id": 442781,"Sequence number": 5285393, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5004 + } + }, + { + "ph": "s", "id": 207, "pid": 4183441, "tid": 4183441, "ts": 676007610414.901, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007610430.939, "dur": 9.833, + "args": { + "External id": 442782,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007610436.294, "dur": 4.226, + "args": { + "External id": 442783,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007610510.958, "dur": 91.741, + "args": { + "External id": 442784,"Record function id": 0, "Ev Idx": 5007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007610604.025, "dur": 1125.861, + "args": { + "External id": 442785,"Record function id": 0, "Ev Idx": 5008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007610643.408, "dur": 1069.864, + "args": { + "External id": 442786,"Sequence number": 5285394, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5009 + } + }, + { + "ph": "s", "id": 206, "pid": 4183441, "tid": 4183441, "ts": 676007610643.408, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007610751.102, "dur": 44.041, + "args": { + "External id": 442787,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007610808.469, "dur": 93.614, + "args": { + "External id": 442788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007610912.869, "dur": 35.563, + "args": { + "External id": 442789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007610956.458, "dur": 29.393, + "args": { + "External id": 442790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007611011.542, "dur": 28.757, + "args": { + "External id": 442791,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007611060.239, "dur": 15.588, + "args": { + "External id": 442792,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007611112.068, "dur": 135.479, + "args": { + "External id": 442793,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007611163.756, "dur": 14.453, + "args": { + "External id": 442794,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007611168.686, "dur": 8.643, + "args": { + "External id": 442795,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007611182.835, "dur": 3.671, + "args": { + "External id": 442796,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007611187.495, "dur": 0.933, + "args": { + "External id": 442797,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007611190.738, "dur": 3.372, + "args": { + "External id": 442798,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007611258.620, "dur": 50.091, + "args": { + "External id": 442799,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007611337.787, "dur": 28.866, + "args": { + "External id": 442800,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007611374.480, "dur": 38.036, + "args": { + "External id": 442801,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007611421.093, "dur": 30.644, + "args": { + "External id": 442802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007611475.684, "dur": 25.133, + "args": { + "External id": 442803,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007611506.058, "dur": 44.412, + "args": { + "External id": 442804,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007611572.282, "dur": 19.351, + "args": { + "External id": 442805,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5028 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.2)", "pid": 4183441, "tid": 4183441, + "ts": 676007611796.427, "dur": 86.596, + "args": { + "External id": 442806,"Record function id": 0, "Ev Idx": 5029 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007611957.597, "dur": 47.274, + "args": { + "External id": 442807,"Record function id": 0, "Ev Idx": 5030 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.3)", "pid": 4183441, "tid": 4183441, + "ts": 676007612013.774, "dur": 8822.203, + "args": { + "External id": 442808,"Record function id": 0, "Ev Idx": 5031 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 4183441, "tid": 4183441, + "ts": 676007612025.047, "dur": 973.617, + "args": { + "External id": 442809,"Record function id": 0, "Ev Idx": 5032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007612128.685, "dur": 10.130, + "args": { + "External id": 442810,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007612152.497, "dur": 45.435, + "args": { + "External id": 442811,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612158.944, "dur": 2.240, + "args": { + "External id": 442812,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612165.481, "dur": 0.276, + "args": { + "External id": 442813,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612168.757, "dur": 0.322, + "args": { + "External id": 442814,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612174.333, "dur": 0.386, + "args": { + "External id": 442815,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612177.526, "dur": 0.408, + "args": { + "External id": 442816,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612180.607, "dur": 0.356, + "args": { + "External id": 442817,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612181.795, "dur": 3.718, + "args": { + "External id": 442818,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612186.050, "dur": 0.306, + "args": { + "External id": 442819,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612189.141, "dur": 0.277, + "args": { + "External id": 442820,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007612209.981, "dur": 46.284, + "args": { + "External id": 442821,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007612289.285, "dur": 134.373, + "args": { + "External id": 442822,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007612303.423, "dur": 3.600, + "args": { + "External id": 442823,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007612312.712, "dur": 9.448, + "args": { + "External id": 442824,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007612317.220, "dur": 4.553, + "args": { + "External id": 442825,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612320.012, "dur": 0.645, + "args": { + "External id": 442826,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007612328.507, "dur": 36.364, + "args": { + "External id": 442827,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612331.687, "dur": 2.744, + "args": { + "External id": 442828,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612335.418, "dur": 0.447, + "args": { + "External id": 442829,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612336.502, "dur": 0.329, + "args": { + "External id": 442830,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612342.450, "dur": 1.696, + "args": { + "External id": 442831,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612344.756, "dur": 0.453, + "args": { + "External id": 442832,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612345.977, "dur": 0.292, + "args": { + "External id": 442833,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612351.934, "dur": 0.294, + "args": { + "External id": 442834,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612353.240, "dur": 0.249, + "args": { + "External id": 442835,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007612356.273, "dur": 2.744, + "args": { + "External id": 442836,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007612390.580, "dur": 24.540, + "args": { + "External id": 442837,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007612478.696, "dur": 422.226, + "args": { + "External id": 442838,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007612512.257, "dur": 382.995, + "args": { + "External id": 442839,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5062, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007612523.884, "dur": 365.229, + "args": { + "External id": 442840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007612924.302, "dur": 2.522, + "args": { + "External id": 442841,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5064, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 4183441, "tid": 4183441, + "ts": 676007613019.664, "dur": 7574.572, + "args": { + "External id": 442842,"Record function id": 0, "Ev Idx": 5065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613138.619, "dur": 6.695, + "args": { + "External id": 442843,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613148.783, "dur": 1.257, + "args": { + "External id": 442844,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613151.700, "dur": 2.541, + "args": { + "External id": 442845,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613155.626, "dur": 0.898, + "args": { + "External id": 442846,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613157.851, "dur": 1.090, + "args": { + "External id": 442847,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613163.577, "dur": 1.125, + "args": { + "External id": 442848,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613168.709, "dur": 1.132, + "args": { + "External id": 442849,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613171.144, "dur": 2.829, + "args": { + "External id": 442850,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613175.509, "dur": 0.943, + "args": { + "External id": 442851,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007613180.243, "dur": 0.969, + "args": { + "External id": 442852,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007613198.523, "dur": 7356.131, + "args": { + "External id": 442853,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007613215.987, "dur": 7331.804, + "args": { + "External id": 442854,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007613233.322, "dur": 15.668, + "args": { + "External id": 442855,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007613251.782, "dur": 7262.813, + "args": { + "External id": 442856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007613254.705, "dur": 7259.377, + "args": { + "External id": 442857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007613260.705, "dur": 6.339, + "args": { + "External id": 442858,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007613268.844, "dur": 7242.181, + "args": { + "External id": 442859,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007620762.269, "dur": 48.356, + "args": { + "External id": 442860,"Sequence number": 5285395, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5083 + } + }, + { + "ph": "s", "id": 205, "pid": 4183441, "tid": 4183441, "ts": 676007620762.269, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007620794.776, "dur": 11.067, + "args": { + "External id": 442861,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007620800.825, "dur": 4.653, + "args": { + "External id": 442862,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007620876.486, "dur": 94.743, + "args": { + "External id": 442863,"Record function id": 0, "Ev Idx": 5086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007620972.635, "dur": 1150.561, + "args": { + "External id": 442864,"Record function id": 0, "Ev Idx": 5087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007621013.770, "dur": 1093.400, + "args": { + "External id": 442865,"Sequence number": 5285396, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5088 + } + }, + { + "ph": "s", "id": 204, "pid": 4183441, "tid": 4183441, "ts": 676007621013.770, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007621097.614, "dur": 42.433, + "args": { + "External id": 442866,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621153.824, "dur": 93.098, + "args": { + "External id": 442867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621260.419, "dur": 34.742, + "args": { + "External id": 442868,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621300.892, "dur": 28.969, + "args": { + "External id": 442869,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007621362.877, "dur": 25.539, + "args": { + "External id": 442870,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007621405.091, "dur": 17.148, + "args": { + "External id": 442871,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007621440.161, "dur": 133.948, + "args": { + "External id": 442872,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007621490.839, "dur": 11.321, + "args": { + "External id": 442873,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007621495.565, "dur": 5.635, + "args": { + "External id": 442874,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007621506.938, "dur": 5.722, + "args": { + "External id": 442875,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007621513.831, "dur": 0.891, + "args": { + "External id": 442876,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007621519.148, "dur": 2.883, + "args": { + "External id": 442877,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621584.453, "dur": 44.538, + "args": { + "External id": 442878,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007621700.474, "dur": 35.767, + "args": { + "External id": 442879,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621747.337, "dur": 43.297, + "args": { + "External id": 442880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621818.337, "dur": 49.852, + "args": { + "External id": 442881,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007621897.504, "dur": 27.248, + "args": { + "External id": 442882,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007621930.425, "dur": 48.895, + "args": { + "External id": 442883,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007621997.121, "dur": 21.388, + "args": { + "External id": 442884,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5107 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.3)", "pid": 4183441, "tid": 4183441, + "ts": 676007622190.724, "dur": 86.746, + "args": { + "External id": 442885,"Record function id": 0, "Ev Idx": 5108 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007622352.938, "dur": 46.837, + "args": { + "External id": 442886,"Record function id": 0, "Ev Idx": 5109 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.4)", "pid": 4183441, "tid": 4183441, + "ts": 676007622408.546, "dur": 9240.410, + "args": { + "External id": 442887,"Record function id": 0, "Ev Idx": 5110 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 4183441, "tid": 4183441, + "ts": 676007622420.299, "dur": 949.279, + "args": { + "External id": 442888,"Record function id": 0, "Ev Idx": 5111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007622505.030, "dur": 8.423, + "args": { + "External id": 442889,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007622527.026, "dur": 43.440, + "args": { + "External id": 442890,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622534.208, "dur": 2.400, + "args": { + "External id": 442891,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622540.574, "dur": 0.274, + "args": { + "External id": 442892,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622544.266, "dur": 0.302, + "args": { + "External id": 442893,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622545.362, "dur": 0.426, + "args": { + "External id": 442894,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622548.637, "dur": 0.420, + "args": { + "External id": 442895,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622552.265, "dur": 0.472, + "args": { + "External id": 442896,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622553.404, "dur": 3.587, + "args": { + "External id": 442897,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622557.816, "dur": 0.375, + "args": { + "External id": 442898,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622561.343, "dur": 0.152, + "args": { + "External id": 442899,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007622582.581, "dur": 40.402, + "args": { + "External id": 442900,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007622696.117, "dur": 121.066, + "args": { + "External id": 442901,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007622712.165, "dur": 5.346, + "args": { + "External id": 442902,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007622723.622, "dur": 10.765, + "args": { + "External id": 442903,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007622728.414, "dur": 5.579, + "args": { + "External id": 442904,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622731.601, "dur": 0.702, + "args": { + "External id": 442905,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007622741.747, "dur": 31.644, + "args": { + "External id": 442906,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622744.777, "dur": 2.250, + "args": { + "External id": 442907,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622748.253, "dur": 0.387, + "args": { + "External id": 442908,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622749.404, "dur": 0.256, + "args": { + "External id": 442909,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622754.654, "dur": 1.624, + "args": { + "External id": 442910,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622757.439, "dur": 0.398, + "args": { + "External id": 442911,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622758.468, "dur": 0.356, + "args": { + "External id": 442912,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622761.579, "dur": 0.500, + "args": { + "External id": 442913,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622762.604, "dur": 0.309, + "args": { + "External id": 442914,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007622765.021, "dur": 2.281, + "args": { + "External id": 442915,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007622783.816, "dur": 24.747, + "args": { + "External id": 442916,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007622872.677, "dur": 398.546, + "args": { + "External id": 442917,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007622908.390, "dur": 356.722, + "args": { + "External id": 442918,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5141, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007622918.804, "dur": 340.300, + "args": { + "External id": 442919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007623295.974, "dur": 2.604, + "args": { + "External id": 442920,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5143, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 4183441, "tid": 4183441, + "ts": 676007623390.879, "dur": 8069.938, + "args": { + "External id": 442921,"Record function id": 0, "Ev Idx": 5144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623489.292, "dur": 6.272, + "args": { + "External id": 442922,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623498.756, "dur": 1.229, + "args": { + "External id": 442923,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623501.963, "dur": 2.612, + "args": { + "External id": 442924,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623506.452, "dur": 1.041, + "args": { + "External id": 442925,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623508.776, "dur": 1.078, + "args": { + "External id": 442926,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623511.289, "dur": 0.887, + "args": { + "External id": 442927,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623516.157, "dur": 1.156, + "args": { + "External id": 442928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623518.776, "dur": 2.546, + "args": { + "External id": 442929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623522.542, "dur": 0.877, + "args": { + "External id": 442930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007623524.609, "dur": 0.737, + "args": { + "External id": 442931,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007623544.936, "dur": 7878.278, + "args": { + "External id": 442932,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007623562.005, "dur": 7855.137, + "args": { + "External id": 442933,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007623577.637, "dur": 15.276, + "args": { + "External id": 442934,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007623595.565, "dur": 7788.950, + "args": { + "External id": 442935,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007623598.133, "dur": 7785.902, + "args": { + "External id": 442936,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007623603.847, "dur": 4.506, + "args": { + "External id": 442937,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007623610.019, "dur": 7771.220, + "args": { + "External id": 442938,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007631594.989, "dur": 29.999, + "args": { + "External id": 442939,"Sequence number": 5285397, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5162 + } + }, + { + "ph": "s", "id": 203, "pid": 4183441, "tid": 4183441, "ts": 676007631594.989, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007631611.183, "dur": 9.386, + "args": { + "External id": 442940,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007631616.156, "dur": 4.231, + "args": { + "External id": 442941,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007631719.220, "dur": 93.697, + "args": { + "External id": 442942,"Record function id": 0, "Ev Idx": 5165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007631815.154, "dur": 1114.081, + "args": { + "External id": 442943,"Record function id": 0, "Ev Idx": 5166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007631857.407, "dur": 1057.310, + "args": { + "External id": 442944,"Sequence number": 5285398, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5167 + } + }, + { + "ph": "s", "id": 202, "pid": 4183441, "tid": 4183441, "ts": 676007631857.407, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007631924.742, "dur": 44.562, + "args": { + "External id": 442945,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007631982.708, "dur": 92.667, + "args": { + "External id": 442946,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632105.162, "dur": 39.761, + "args": { + "External id": 442947,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632155.824, "dur": 28.447, + "args": { + "External id": 442948,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007632212.643, "dur": 27.629, + "args": { + "External id": 442949,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007632257.331, "dur": 15.788, + "args": { + "External id": 442950,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007632291.565, "dur": 132.565, + "args": { + "External id": 442951,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007632341.554, "dur": 10.965, + "args": { + "External id": 442952,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007632346.342, "dur": 5.355, + "args": { + "External id": 442953,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007632357.099, "dur": 7.763, + "args": { + "External id": 442954,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007632366.169, "dur": 0.947, + "args": { + "External id": 442955,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007632369.306, "dur": 4.088, + "args": { + "External id": 442956,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632435.085, "dur": 44.434, + "args": { + "External id": 442957,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007632509.642, "dur": 27.189, + "args": { + "External id": 442958,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632545.476, "dur": 35.750, + "args": { + "External id": 442959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632589.931, "dur": 31.031, + "args": { + "External id": 442960,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007632644.475, "dur": 75.006, + "args": { + "External id": 442961,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007632727.952, "dur": 52.282, + "args": { + "External id": 442962,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007632802.463, "dur": 24.619, + "args": { + "External id": 442963,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5186 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.4)", "pid": 4183441, "tid": 4183441, + "ts": 676007632993.427, "dur": 80.075, + "args": { + "External id": 442964,"Record function id": 0, "Ev Idx": 5187 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007633169.180, "dur": 48.626, + "args": { + "External id": 442965,"Record function id": 0, "Ev Idx": 5188 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.5)", "pid": 4183441, "tid": 4183441, + "ts": 676007633227.480, "dur": 8814.959, + "args": { + "External id": 442966,"Record function id": 0, "Ev Idx": 5189 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 4183441, "tid": 4183441, + "ts": 676007633238.777, "dur": 938.906, + "args": { + "External id": 442967,"Record function id": 0, "Ev Idx": 5190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007633324.612, "dur": 8.412, + "args": { + "External id": 442968,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007633346.487, "dur": 40.527, + "args": { + "External id": 442969,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633353.629, "dur": 2.558, + "args": { + "External id": 442970,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633360.255, "dur": 0.443, + "args": { + "External id": 442971,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633363.886, "dur": 0.204, + "args": { + "External id": 442972,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633365.043, "dur": 0.606, + "args": { + "External id": 442973,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633368.470, "dur": 0.420, + "args": { + "External id": 442974,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633371.122, "dur": 0.521, + "args": { + "External id": 442975,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633372.307, "dur": 3.940, + "args": { + "External id": 442976,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633376.848, "dur": 0.317, + "args": { + "External id": 442977,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633380.175, "dur": 0.241, + "args": { + "External id": 442978,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007633399.923, "dur": 42.022, + "args": { + "External id": 442979,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007633475.666, "dur": 117.885, + "args": { + "External id": 442980,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007633489.857, "dur": 3.572, + "args": { + "External id": 442981,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007633499.262, "dur": 9.627, + "args": { + "External id": 442982,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007633503.970, "dur": 4.527, + "args": { + "External id": 442983,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633506.782, "dur": 0.644, + "args": { + "External id": 442984,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007633515.290, "dur": 32.410, + "args": { + "External id": 442985,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633519.128, "dur": 2.455, + "args": { + "External id": 442986,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633522.686, "dur": 0.504, + "args": { + "External id": 442987,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633524.055, "dur": 0.369, + "args": { + "External id": 442988,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633528.981, "dur": 1.546, + "args": { + "External id": 442989,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633531.168, "dur": 0.353, + "args": { + "External id": 442990,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633532.207, "dur": 0.670, + "args": { + "External id": 442991,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633536.883, "dur": 0.418, + "args": { + "External id": 442992,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633538.118, "dur": 0.420, + "args": { + "External id": 442993,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007633541.063, "dur": 2.660, + "args": { + "External id": 442994,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007633564.287, "dur": 21.874, + "args": { + "External id": 442995,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007633648.657, "dur": 412.953, + "args": { + "External id": 442996,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007633723.223, "dur": 332.839, + "args": { + "External id": 442997,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5220, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007633734.994, "dur": 315.913, + "args": { + "External id": 442998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007634101.438, "dur": 3.516, + "args": { + "External id": 442999,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5222, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 4183441, "tid": 4183441, + "ts": 676007634199.705, "dur": 7646.105, + "args": { + "External id": 443000,"Record function id": 0, "Ev Idx": 5223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634299.242, "dur": 6.782, + "args": { + "External id": 443001,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634310.028, "dur": 1.368, + "args": { + "External id": 443002,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634313.176, "dur": 3.237, + "args": { + "External id": 443003,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634317.844, "dur": 0.981, + "args": { + "External id": 443004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634320.207, "dur": 0.989, + "args": { + "External id": 443005,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634322.355, "dur": 1.040, + "args": { + "External id": 443006,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634326.995, "dur": 0.996, + "args": { + "External id": 443007,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634329.275, "dur": 2.289, + "args": { + "External id": 443008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634332.868, "dur": 0.982, + "args": { + "External id": 443009,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007634335.191, "dur": 0.989, + "args": { + "External id": 443010,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007634356.943, "dur": 7439.270, + "args": { + "External id": 443011,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007634380.384, "dur": 7408.985, + "args": { + "External id": 443012,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007634395.478, "dur": 15.252, + "args": { + "External id": 443013,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007634413.532, "dur": 7343.348, + "args": { + "External id": 443014,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007634416.432, "dur": 7339.890, + "args": { + "External id": 443015,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007634423.348, "dur": 4.877, + "args": { + "External id": 443016,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007634429.928, "dur": 7323.405, + "args": { + "External id": 443017,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007641988.397, "dur": 29.058, + "args": { + "External id": 443018,"Sequence number": 5285399, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5241 + } + }, + { + "ph": "s", "id": 201, "pid": 4183441, "tid": 4183441, "ts": 676007641988.397, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007642004.969, "dur": 7.791, + "args": { + "External id": 443019,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007642008.247, "dur": 4.289, + "args": { + "External id": 443020,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007642099.561, "dur": 93.780, + "args": { + "External id": 443021,"Record function id": 0, "Ev Idx": 5244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007642195.735, "dur": 1099.160, + "args": { + "External id": 443022,"Record function id": 0, "Ev Idx": 5245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007642239.837, "dur": 1041.285, + "args": { + "External id": 443023,"Sequence number": 5285400, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5246 + } + }, + { + "ph": "s", "id": 200, "pid": 4183441, "tid": 4183441, "ts": 676007642239.837, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007642310.101, "dur": 44.680, + "args": { + "External id": 443024,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007642367.102, "dur": 93.895, + "args": { + "External id": 443025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007642470.777, "dur": 33.813, + "args": { + "External id": 443026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007642514.514, "dur": 28.748, + "args": { + "External id": 443027,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007642567.449, "dur": 24.968, + "args": { + "External id": 443028,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007642609.693, "dur": 19.012, + "args": { + "External id": 443029,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007642694.201, "dur": 133.732, + "args": { + "External id": 443030,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007642746.592, "dur": 15.480, + "args": { + "External id": 443031,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007642751.865, "dur": 9.156, + "args": { + "External id": 443032,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007642764.849, "dur": 4.015, + "args": { + "External id": 443033,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007642770.308, "dur": 0.899, + "args": { + "External id": 443034,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007642773.714, "dur": 3.378, + "args": { + "External id": 443035,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007642839.021, "dur": 49.998, + "args": { + "External id": 443036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007642924.155, "dur": 30.845, + "args": { + "External id": 443037,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007642962.797, "dur": 37.109, + "args": { + "External id": 443038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007643008.032, "dur": 33.953, + "args": { + "External id": 443039,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007643063.053, "dur": 46.808, + "args": { + "External id": 443040,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007643117.347, "dur": 51.575, + "args": { + "External id": 443041,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007643191.360, "dur": 19.996, + "args": { + "External id": 443042,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5265 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.5)", "pid": 4183441, "tid": 4183441, + "ts": 676007643361.159, "dur": 81.210, + "args": { + "External id": 443043,"Record function id": 0, "Ev Idx": 5266 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007643517.334, "dur": 48.637, + "args": { + "External id": 443044,"Record function id": 0, "Ev Idx": 5267 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.6)", "pid": 4183441, "tid": 4183441, + "ts": 676007643575.888, "dur": 8772.626, + "args": { + "External id": 443045,"Record function id": 0, "Ev Idx": 5268 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 4183441, "tid": 4183441, + "ts": 676007643583.777, "dur": 1017.443, + "args": { + "External id": 443046,"Record function id": 0, "Ev Idx": 5269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007643723.156, "dur": 9.767, + "args": { + "External id": 443047,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007643747.591, "dur": 40.671, + "args": { + "External id": 443048,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643753.190, "dur": 2.303, + "args": { + "External id": 443049,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643760.158, "dur": 0.422, + "args": { + "External id": 443050,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643762.374, "dur": 0.160, + "args": { + "External id": 443051,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643764.233, "dur": 0.394, + "args": { + "External id": 443052,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643767.959, "dur": 0.523, + "args": { + "External id": 443053,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643769.775, "dur": 0.353, + "args": { + "External id": 443054,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643771.960, "dur": 3.952, + "args": { + "External id": 443055,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643777.890, "dur": 0.576, + "args": { + "External id": 443056,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643780.240, "dur": 0.376, + "args": { + "External id": 443057,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007643801.569, "dur": 42.896, + "args": { + "External id": 443058,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007643880.834, "dur": 119.999, + "args": { + "External id": 443059,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007643894.179, "dur": 3.516, + "args": { + "External id": 443060,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007643903.291, "dur": 10.693, + "args": { + "External id": 443061,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007643907.610, "dur": 5.984, + "args": { + "External id": 443062,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643911.606, "dur": 0.552, + "args": { + "External id": 443063,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007643920.155, "dur": 36.494, + "args": { + "External id": 443064,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643922.534, "dur": 2.698, + "args": { + "External id": 443065,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643927.714, "dur": 0.245, + "args": { + "External id": 443066,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643930.288, "dur": 0.302, + "args": { + "External id": 443067,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643934.236, "dur": 1.268, + "args": { + "External id": 443068,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643937.013, "dur": 0.299, + "args": { + "External id": 443069,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643939.267, "dur": 0.273, + "args": { + "External id": 443070,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643943.630, "dur": 0.198, + "args": { + "External id": 443071,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643945.345, "dur": 0.324, + "args": { + "External id": 443072,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007643947.415, "dur": 2.012, + "args": { + "External id": 443073,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007643970.525, "dur": 21.469, + "args": { + "External id": 443074,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007644056.408, "dur": 446.037, + "args": { + "External id": 443075,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007644113.566, "dur": 383.469, + "args": { + "External id": 443076,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5299, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007644125.548, "dur": 365.810, + "args": { + "External id": 443077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007644526.428, "dur": 2.565, + "args": { + "External id": 443078,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5301, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 4183441, "tid": 4183441, + "ts": 676007644622.068, "dur": 7528.050, + "args": { + "External id": 443079,"Record function id": 0, "Ev Idx": 5302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644778.883, "dur": 7.113, + "args": { + "External id": 443080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644790.380, "dur": 1.217, + "args": { + "External id": 443081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644793.753, "dur": 2.374, + "args": { + "External id": 443082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644797.909, "dur": 1.512, + "args": { + "External id": 443083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644800.891, "dur": 1.219, + "args": { + "External id": 443084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644803.621, "dur": 0.980, + "args": { + "External id": 443085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644808.013, "dur": 1.180, + "args": { + "External id": 443086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644811.223, "dur": 2.857, + "args": { + "External id": 443087,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644815.682, "dur": 0.992, + "args": { + "External id": 443088,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007644818.517, "dur": 0.880, + "args": { + "External id": 443089,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007644840.503, "dur": 7254.704, + "args": { + "External id": 443090,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007644857.065, "dur": 7220.178, + "args": { + "External id": 443091,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007644877.391, "dur": 15.504, + "args": { + "External id": 443092,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007644895.784, "dur": 7149.189, + "args": { + "External id": 443093,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007644898.368, "dur": 7146.173, + "args": { + "External id": 443094,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007644904.424, "dur": 6.697, + "args": { + "External id": 443095,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007644912.924, "dur": 7128.867, + "args": { + "External id": 443096,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007652294.883, "dur": 29.237, + "args": { + "External id": 443097,"Sequence number": 5285401, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5320 + } + }, + { + "ph": "s", "id": 199, "pid": 4183441, "tid": 4183441, "ts": 676007652294.883, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007652311.454, "dur": 7.995, + "args": { + "External id": 443098,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007652314.764, "dur": 4.422, + "args": { + "External id": 443099,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007652389.107, "dur": 94.484, + "args": { + "External id": 443100,"Record function id": 0, "Ev Idx": 5323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007652485.655, "dur": 1085.573, + "args": { + "External id": 443101,"Record function id": 0, "Ev Idx": 5324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007652527.161, "dur": 1030.434, + "args": { + "External id": 443102,"Sequence number": 5285402, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5325 + } + }, + { + "ph": "s", "id": 198, "pid": 4183441, "tid": 4183441, "ts": 676007652527.161, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007652593.804, "dur": 42.160, + "args": { + "External id": 443103,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007652648.643, "dur": 131.367, + "args": { + "External id": 443104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007652793.559, "dur": 37.143, + "args": { + "External id": 443105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007652839.788, "dur": 29.949, + "args": { + "External id": 443106,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007652896.449, "dur": 29.383, + "args": { + "External id": 443107,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007652943.132, "dur": 16.491, + "args": { + "External id": 443108,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007652977.865, "dur": 150.916, + "args": { + "External id": 443109,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007653028.044, "dur": 11.903, + "args": { + "External id": 443110,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007653033.489, "dur": 5.505, + "args": { + "External id": 443111,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007653042.617, "dur": 6.323, + "args": { + "External id": 443112,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007653050.496, "dur": 0.841, + "args": { + "External id": 443113,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007653053.891, "dur": 3.775, + "args": { + "External id": 443114,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007653140.655, "dur": 50.984, + "args": { + "External id": 443115,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007653223.696, "dur": 31.876, + "args": { + "External id": 443116,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007653264.640, "dur": 37.565, + "args": { + "External id": 443117,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007653310.049, "dur": 31.734, + "args": { + "External id": 443118,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007653365.443, "dur": 26.791, + "args": { + "External id": 443119,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007653397.560, "dur": 47.657, + "args": { + "External id": 443120,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007653465.238, "dur": 17.629, + "args": { + "External id": 443121,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5344 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.6)", "pid": 4183441, "tid": 4183441, + "ts": 676007653635.327, "dur": 138.685, + "args": { + "External id": 443122,"Record function id": 0, "Ev Idx": 5345 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007653854.029, "dur": 49.140, + "args": { + "External id": 443123,"Record function id": 0, "Ev Idx": 5346 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.7)", "pid": 4183441, "tid": 4183441, + "ts": 676007653913.423, "dur": 8521.908, + "args": { + "External id": 443124,"Record function id": 0, "Ev Idx": 5347 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 4183441, "tid": 4183441, + "ts": 676007653921.275, "dur": 982.859, + "args": { + "External id": 443125,"Record function id": 0, "Ev Idx": 5348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007654006.405, "dur": 8.735, + "args": { + "External id": 443126,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007654028.706, "dur": 41.955, + "args": { + "External id": 443127,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654035.028, "dur": 2.613, + "args": { + "External id": 443128,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654042.668, "dur": 0.412, + "args": { + "External id": 443129,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654044.545, "dur": 0.391, + "args": { + "External id": 443130,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654046.650, "dur": 0.230, + "args": { + "External id": 443131,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654050.504, "dur": 0.289, + "args": { + "External id": 443132,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654052.239, "dur": 0.253, + "args": { + "External id": 443133,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654054.053, "dur": 3.833, + "args": { + "External id": 443134,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654059.729, "dur": 0.160, + "args": { + "External id": 443135,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654061.196, "dur": 0.307, + "args": { + "External id": 443136,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007654106.241, "dur": 44.967, + "args": { + "External id": 443137,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007654188.477, "dur": 128.460, + "args": { + "External id": 443138,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007654201.784, "dur": 4.820, + "args": { + "External id": 443139,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007654211.973, "dur": 11.018, + "args": { + "External id": 443140,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007654216.339, "dur": 6.259, + "args": { + "External id": 443141,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654220.303, "dur": 0.632, + "args": { + "External id": 443142,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007654230.157, "dur": 33.260, + "args": { + "External id": 443143,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654232.531, "dur": 2.633, + "args": { + "External id": 443144,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654236.829, "dur": 0.570, + "args": { + "External id": 443145,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654239.132, "dur": 0.287, + "args": { + "External id": 443146,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654243.438, "dur": 1.039, + "args": { + "External id": 443147,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654246.418, "dur": 0.279, + "args": { + "External id": 443148,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654248.465, "dur": 0.154, + "args": { + "External id": 443149,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654251.538, "dur": 0.154, + "args": { + "External id": 443150,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654253.312, "dur": 0.148, + "args": { + "External id": 443151,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007654254.913, "dur": 2.275, + "args": { + "External id": 443152,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007654280.163, "dur": 23.347, + "args": { + "External id": 443153,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007654370.295, "dur": 434.992, + "args": { + "External id": 443154,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007654402.989, "dur": 396.320, + "args": { + "External id": 443155,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5378, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007654414.161, "dur": 378.681, + "args": { + "External id": 443156,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007654829.595, "dur": 2.306, + "args": { + "External id": 443157,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5380, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 4183441, "tid": 4183441, + "ts": 676007654925.374, "dur": 7311.844, + "args": { + "External id": 443158,"Record function id": 0, "Ev Idx": 5381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655037.497, "dur": 6.669, + "args": { + "External id": 443159,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655047.665, "dur": 1.198, + "args": { + "External id": 443160,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655051.138, "dur": 2.512, + "args": { + "External id": 443161,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655057.166, "dur": 1.366, + "args": { + "External id": 443162,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655060.123, "dur": 1.143, + "args": { + "External id": 443163,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655063.138, "dur": 0.952, + "args": { + "External id": 443164,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655065.784, "dur": 1.136, + "args": { + "External id": 443165,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655069.878, "dur": 3.002, + "args": { + "External id": 443166,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655074.793, "dur": 0.997, + "args": { + "External id": 443167,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007655077.292, "dur": 0.890, + "args": { + "External id": 443168,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007655122.328, "dur": 7063.259, + "args": { + "External id": 443169,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007655139.550, "dur": 7039.117, + "args": { + "External id": 443170,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007655155.211, "dur": 15.758, + "args": { + "External id": 443171,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007655175.229, "dur": 6972.828, + "args": { + "External id": 443172,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007655177.966, "dur": 6969.640, + "args": { + "External id": 443173,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007655184.955, "dur": 6.909, + "args": { + "External id": 443174,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007655193.922, "dur": 6950.767, + "args": { + "External id": 443175,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007662380.598, "dur": 29.608, + "args": { + "External id": 443176,"Sequence number": 5285403, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5399 + } + }, + { + "ph": "s", "id": 197, "pid": 4183441, "tid": 4183441, "ts": 676007662380.598, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007662397.710, "dur": 7.846, + "args": { + "External id": 443177,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007662401.094, "dur": 4.228, + "args": { + "External id": 443178,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007662475.893, "dur": 94.054, + "args": { + "External id": 443179,"Record function id": 0, "Ev Idx": 5402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007662571.568, "dur": 1071.088, + "args": { + "External id": 443180,"Record function id": 0, "Ev Idx": 5403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007662614.283, "dur": 1014.571, + "args": { + "External id": 443181,"Sequence number": 5285404, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5404 + } + }, + { + "ph": "s", "id": 196, "pid": 4183441, "tid": 4183441, "ts": 676007662614.283, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007662714.869, "dur": 46.391, + "args": { + "External id": 443182,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007662775.507, "dur": 91.776, + "args": { + "External id": 443183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007662876.575, "dur": 33.866, + "args": { + "External id": 443184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007662919.177, "dur": 28.033, + "args": { + "External id": 443185,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007662970.917, "dur": 25.717, + "args": { + "External id": 443186,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007663015.809, "dur": 15.137, + "args": { + "External id": 443187,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007663050.002, "dur": 159.828, + "args": { + "External id": 443188,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007663118.337, "dur": 12.374, + "args": { + "External id": 443189,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007663123.544, "dur": 6.241, + "args": { + "External id": 443190,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007663134.155, "dur": 5.219, + "args": { + "External id": 443191,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007663148.172, "dur": 1.251, + "args": { + "External id": 443192,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007663152.284, "dur": 4.110, + "args": { + "External id": 443193,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007663220.827, "dur": 49.507, + "args": { + "External id": 443194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007663301.612, "dur": 29.555, + "args": { + "External id": 443195,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007663340.351, "dur": 37.563, + "args": { + "External id": 443196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007663386.346, "dur": 30.524, + "args": { + "External id": 443197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007663438.649, "dur": 27.976, + "args": { + "External id": 443198,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007663472.252, "dur": 44.844, + "args": { + "External id": 443199,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007663537.977, "dur": 19.852, + "args": { + "External id": 443200,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5423 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.7)", "pid": 4183441, "tid": 4183441, + "ts": 676007663746.837, "dur": 83.785, + "args": { + "External id": 443201,"Record function id": 0, "Ev Idx": 5424 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007663905.470, "dur": 47.650, + "args": { + "External id": 443202,"Record function id": 0, "Ev Idx": 5425 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.8)", "pid": 4183441, "tid": 4183441, + "ts": 676007663963.673, "dur": 8580.301, + "args": { + "External id": 443203,"Record function id": 0, "Ev Idx": 5426 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 4183441, "tid": 4183441, + "ts": 676007663972.557, "dur": 954.707, + "args": { + "External id": 443204,"Record function id": 0, "Ev Idx": 5427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007664058.628, "dur": 8.575, + "args": { + "External id": 443205,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007664096.392, "dur": 42.786, + "args": { + "External id": 443206,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664103.012, "dur": 2.496, + "args": { + "External id": 443207,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664110.634, "dur": 0.500, + "args": { + "External id": 443208,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664112.846, "dur": 0.385, + "args": { + "External id": 443209,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664115.005, "dur": 0.416, + "args": { + "External id": 443210,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664119.528, "dur": 0.564, + "args": { + "External id": 443211,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664121.630, "dur": 0.249, + "args": { + "External id": 443212,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664123.433, "dur": 3.821, + "args": { + "External id": 443213,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664129.138, "dur": 0.335, + "args": { + "External id": 443214,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664131.400, "dur": 0.314, + "args": { + "External id": 443215,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007664152.083, "dur": 44.269, + "args": { + "External id": 443216,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007664233.233, "dur": 123.071, + "args": { + "External id": 443217,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007664244.900, "dur": 4.410, + "args": { + "External id": 443218,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007664254.987, "dur": 10.815, + "args": { + "External id": 443219,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007664259.531, "dur": 5.880, + "args": { + "External id": 443220,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664263.629, "dur": 0.547, + "args": { + "External id": 443221,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007664273.893, "dur": 34.774, + "args": { + "External id": 443222,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664276.130, "dur": 2.983, + "args": { + "External id": 443223,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664280.516, "dur": 0.548, + "args": { + "External id": 443224,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664282.768, "dur": 0.311, + "args": { + "External id": 443225,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664286.987, "dur": 1.885, + "args": { + "External id": 443226,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664290.897, "dur": 0.157, + "args": { + "External id": 443227,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664292.529, "dur": 0.250, + "args": { + "External id": 443228,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664296.727, "dur": 0.402, + "args": { + "External id": 443229,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664298.747, "dur": 0.420, + "args": { + "External id": 443230,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007664300.886, "dur": 2.582, + "args": { + "External id": 443231,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007664323.626, "dur": 23.622, + "args": { + "External id": 443232,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007664412.940, "dur": 413.078, + "args": { + "External id": 443233,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007664442.797, "dur": 377.450, + "args": { + "External id": 443234,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5457, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007664453.792, "dur": 359.956, + "args": { + "External id": 443235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007664851.984, "dur": 2.423, + "args": { + "External id": 443236,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5459, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 4183441, "tid": 4183441, + "ts": 676007664948.076, "dur": 7395.123, + "args": { + "External id": 443237,"Record function id": 0, "Ev Idx": 5460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665052.443, "dur": 6.554, + "args": { + "External id": 443238,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665062.964, "dur": 1.297, + "args": { + "External id": 443239,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665066.008, "dur": 2.802, + "args": { + "External id": 443240,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665070.556, "dur": 1.138, + "args": { + "External id": 443241,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665073.536, "dur": 0.849, + "args": { + "External id": 443242,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665077.079, "dur": 0.850, + "args": { + "External id": 443243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665079.730, "dur": 0.934, + "args": { + "External id": 443244,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665099.652, "dur": 2.889, + "args": { + "External id": 443245,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665105.829, "dur": 0.828, + "args": { + "External id": 443246,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007665109.031, "dur": 0.680, + "args": { + "External id": 443247,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007665141.708, "dur": 7150.212, + "args": { + "External id": 443248,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007665159.422, "dur": 7126.085, + "args": { + "External id": 443249,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007665175.650, "dur": 15.040, + "args": { + "External id": 443250,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007665193.454, "dur": 7057.222, + "args": { + "External id": 443251,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007665196.076, "dur": 7054.082, + "args": { + "External id": 443252,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007665202.610, "dur": 7.023, + "args": { + "External id": 443253,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007665211.770, "dur": 7035.728, + "args": { + "External id": 443254,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007672489.991, "dur": 29.538, + "args": { + "External id": 443255,"Sequence number": 5285405, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5478 + } + }, + { + "ph": "s", "id": 195, "pid": 4183441, "tid": 4183441, "ts": 676007672489.991, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007672506.672, "dur": 8.197, + "args": { + "External id": 443256,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007672510.304, "dur": 4.305, + "args": { + "External id": 443257,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007672583.899, "dur": 134.319, + "args": { + "External id": 443258,"Record function id": 0, "Ev Idx": 5481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007672721.610, "dur": 1085.826, + "args": { + "External id": 443259,"Record function id": 0, "Ev Idx": 5482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007672764.754, "dur": 1028.468, + "args": { + "External id": 443260,"Sequence number": 5285406, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5483 + } + }, + { + "ph": "s", "id": 194, "pid": 4183441, "tid": 4183441, "ts": 676007672764.754, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007672831.492, "dur": 44.443, + "args": { + "External id": 443261,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007672888.918, "dur": 93.936, + "args": { + "External id": 443262,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007672993.335, "dur": 34.160, + "args": { + "External id": 443263,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007673035.893, "dur": 29.090, + "args": { + "External id": 443264,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007673107.711, "dur": 31.225, + "args": { + "External id": 443265,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007673158.932, "dur": 15.572, + "args": { + "External id": 443266,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007673195.649, "dur": 133.862, + "args": { + "External id": 443267,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007673247.708, "dur": 12.677, + "args": { + "External id": 443268,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007673252.803, "dur": 6.788, + "args": { + "External id": 443269,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007673263.193, "dur": 5.558, + "args": { + "External id": 443270,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007673270.012, "dur": 1.427, + "args": { + "External id": 443271,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007673273.771, "dur": 4.565, + "args": { + "External id": 443272,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007673339.094, "dur": 51.603, + "args": { + "External id": 443273,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007673419.839, "dur": 29.252, + "args": { + "External id": 443274,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007673458.708, "dur": 38.180, + "args": { + "External id": 443275,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007673505.619, "dur": 30.927, + "args": { + "External id": 443276,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007673558.102, "dur": 27.600, + "args": { + "External id": 443277,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007673591.474, "dur": 42.358, + "args": { + "External id": 443278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007673653.930, "dur": 57.963, + "args": { + "External id": 443279,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5502 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.8)", "pid": 4183441, "tid": 4183441, + "ts": 676007673872.884, "dur": 84.494, + "args": { + "External id": 443280,"Record function id": 0, "Ev Idx": 5503 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007674031.586, "dur": 49.318, + "args": { + "External id": 443281,"Record function id": 0, "Ev Idx": 5504 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.9)", "pid": 4183441, "tid": 4183441, + "ts": 676007674111.796, "dur": 8954.009, + "args": { + "External id": 443282,"Record function id": 0, "Ev Idx": 5505 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 4183441, "tid": 4183441, + "ts": 676007674120.804, "dur": 939.597, + "args": { + "External id": 443283,"Record function id": 0, "Ev Idx": 5506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007674207.188, "dur": 10.203, + "args": { + "External id": 443284,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007674230.981, "dur": 38.917, + "args": { + "External id": 443285,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674236.348, "dur": 2.542, + "args": { + "External id": 443286,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674243.693, "dur": 0.573, + "args": { + "External id": 443287,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674245.882, "dur": 0.705, + "args": { + "External id": 443288,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674247.645, "dur": 0.552, + "args": { + "External id": 443289,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674251.438, "dur": 0.716, + "args": { + "External id": 443290,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674253.309, "dur": 0.447, + "args": { + "External id": 443291,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674254.718, "dur": 3.982, + "args": { + "External id": 443292,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674260.247, "dur": 0.555, + "args": { + "External id": 443293,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674262.195, "dur": 0.481, + "args": { + "External id": 443294,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007674282.915, "dur": 43.958, + "args": { + "External id": 443295,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007674360.560, "dur": 128.979, + "args": { + "External id": 443296,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007674371.221, "dur": 4.066, + "args": { + "External id": 443297,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007674381.132, "dur": 11.072, + "args": { + "External id": 443298,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007674386.106, "dur": 5.674, + "args": { + "External id": 443299,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674389.984, "dur": 0.548, + "args": { + "External id": 443300,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007674398.354, "dur": 33.454, + "args": { + "External id": 443301,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674400.382, "dur": 2.749, + "args": { + "External id": 443302,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674408.368, "dur": 0.563, + "args": { + "External id": 443303,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674410.008, "dur": 0.601, + "args": { + "External id": 443304,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674414.039, "dur": 1.403, + "args": { + "External id": 443305,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674416.588, "dur": 0.449, + "args": { + "External id": 443306,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674418.706, "dur": 1.333, + "args": { + "External id": 443307,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674421.409, "dur": 0.372, + "args": { + "External id": 443308,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674422.902, "dur": 0.357, + "args": { + "External id": 443309,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007674427.084, "dur": 0.222, + "args": { + "External id": 443310,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007674453.298, "dur": 28.153, + "args": { + "External id": 443311,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007674544.313, "dur": 417.676, + "args": { + "External id": 443312,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007674571.982, "dur": 384.345, + "args": { + "External id": 443313,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5536, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007674584.145, "dur": 365.129, + "args": { + "External id": 443314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007674984.061, "dur": 2.473, + "args": { + "External id": 443315,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5538, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 4183441, "tid": 4183441, + "ts": 676007675080.251, "dur": 7792.683, + "args": { + "External id": 443316,"Record function id": 0, "Ev Idx": 5539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675209.621, "dur": 7.206, + "args": { + "External id": 443317,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675220.665, "dur": 1.290, + "args": { + "External id": 443318,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675223.822, "dur": 3.023, + "args": { + "External id": 443319,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675228.473, "dur": 1.047, + "args": { + "External id": 443320,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675231.586, "dur": 1.039, + "args": { + "External id": 443321,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675234.265, "dur": 0.953, + "args": { + "External id": 443322,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675237.699, "dur": 0.742, + "args": { + "External id": 443323,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675239.958, "dur": 2.167, + "args": { + "External id": 443324,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675243.973, "dur": 0.925, + "args": { + "External id": 443325,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007675246.406, "dur": 0.643, + "args": { + "External id": 443326,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007675265.072, "dur": 7556.814, + "args": { + "External id": 443327,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007675280.977, "dur": 7533.962, + "args": { + "External id": 443328,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007675298.470, "dur": 15.400, + "args": { + "External id": 443329,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007675316.764, "dur": 7466.546, + "args": { + "External id": 443330,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007675319.417, "dur": 7463.309, + "args": { + "External id": 443331,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007675325.368, "dur": 7.545, + "args": { + "External id": 443332,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007675334.861, "dur": 7444.905, + "args": { + "External id": 443333,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007683011.782, "dur": 28.985, + "args": { + "External id": 443334,"Sequence number": 5285407, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5557 + } + }, + { + "ph": "s", "id": 193, "pid": 4183441, "tid": 4183441, "ts": 676007683011.782, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007683028.077, "dur": 8.145, + "args": { + "External id": 443335,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007683031.572, "dur": 4.414, + "args": { + "External id": 443336,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007683124.006, "dur": 92.369, + "args": { + "External id": 443337,"Record function id": 0, "Ev Idx": 5560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007683218.629, "dur": 1115.432, + "args": { + "External id": 443338,"Record function id": 0, "Ev Idx": 5561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007683259.993, "dur": 1060.141, + "args": { + "External id": 443339,"Sequence number": 5285408, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5562 + } + }, + { + "ph": "s", "id": 192, "pid": 4183441, "tid": 4183441, "ts": 676007683259.993, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007683326.995, "dur": 42.631, + "args": { + "External id": 443340,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007683382.559, "dur": 92.120, + "args": { + "External id": 443341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007683484.410, "dur": 34.974, + "args": { + "External id": 443342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007683528.103, "dur": 29.966, + "args": { + "External id": 443343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007683581.947, "dur": 28.417, + "args": { + "External id": 443344,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007683627.795, "dur": 15.847, + "args": { + "External id": 443345,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007683712.706, "dur": 140.423, + "args": { + "External id": 443346,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007683767.130, "dur": 13.588, + "args": { + "External id": 443347,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007683772.449, "dur": 7.173, + "args": { + "External id": 443348,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007683783.687, "dur": 6.115, + "args": { + "External id": 443349,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007683791.455, "dur": 1.343, + "args": { + "External id": 443350,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007683795.798, "dur": 4.089, + "args": { + "External id": 443351,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007683864.443, "dur": 52.637, + "args": { + "External id": 443352,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007683950.009, "dur": 29.074, + "args": { + "External id": 443353,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007683995.676, "dur": 40.082, + "args": { + "External id": 443354,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007684045.056, "dur": 55.087, + "args": { + "External id": 443355,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007684125.170, "dur": 30.624, + "args": { + "External id": 443356,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007684162.317, "dur": 44.768, + "args": { + "External id": 443357,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007684226.945, "dur": 20.303, + "args": { + "External id": 443358,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5581 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.9)", "pid": 4183441, "tid": 4183441, + "ts": 676007684399.044, "dur": 80.531, + "args": { + "External id": 443359,"Record function id": 0, "Ev Idx": 5582 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007684550.292, "dur": 47.609, + "args": { + "External id": 443360,"Record function id": 0, "Ev Idx": 5583 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.10)", "pid": 4183441, "tid": 4183441, + "ts": 676007684606.433, "dur": 9342.733, + "args": { + "External id": 443361,"Record function id": 0, "Ev Idx": 5584 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 4183441, "tid": 4183441, + "ts": 676007684615.727, "dur": 970.600, + "args": { + "External id": 443362,"Record function id": 0, "Ev Idx": 5585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007684748.970, "dur": 10.774, + "args": { + "External id": 443363,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007684774.107, "dur": 42.190, + "args": { + "External id": 443364,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684779.792, "dur": 2.523, + "args": { + "External id": 443365,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684787.383, "dur": 0.242, + "args": { + "External id": 443366,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684789.869, "dur": 0.516, + "args": { + "External id": 443367,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684792.137, "dur": 0.696, + "args": { + "External id": 443368,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684796.847, "dur": 0.226, + "args": { + "External id": 443369,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684798.769, "dur": 0.494, + "args": { + "External id": 443370,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684801.395, "dur": 3.530, + "args": { + "External id": 443371,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684806.537, "dur": 0.297, + "args": { + "External id": 443372,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684808.664, "dur": 0.392, + "args": { + "External id": 443373,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007684829.480, "dur": 42.821, + "args": { + "External id": 443374,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007684907.288, "dur": 116.556, + "args": { + "External id": 443375,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007684918.202, "dur": 3.920, + "args": { + "External id": 443376,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007684927.670, "dur": 11.618, + "args": { + "External id": 443377,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007684932.348, "dur": 6.507, + "args": { + "External id": 443378,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684937.022, "dur": 0.546, + "args": { + "External id": 443379,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007684946.339, "dur": 34.948, + "args": { + "External id": 443380,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684948.442, "dur": 2.890, + "args": { + "External id": 443381,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684953.334, "dur": 0.607, + "args": { + "External id": 443382,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684956.018, "dur": 0.373, + "args": { + "External id": 443383,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684959.782, "dur": 1.587, + "args": { + "External id": 443384,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684963.619, "dur": 0.256, + "args": { + "External id": 443385,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684965.852, "dur": 0.355, + "args": { + "External id": 443386,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684970.321, "dur": 0.373, + "args": { + "External id": 443387,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684972.140, "dur": 0.415, + "args": { + "External id": 443388,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007684974.234, "dur": 2.295, + "args": { + "External id": 443389,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007684993.376, "dur": 22.834, + "args": { + "External id": 443390,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007685076.604, "dur": 415.751, + "args": { + "External id": 443391,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007685120.532, "dur": 366.411, + "args": { + "External id": 443392,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5615, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007685154.440, "dur": 326.982, + "args": { + "External id": 443393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007685513.090, "dur": 2.322, + "args": { + "External id": 443394,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5617, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 4183441, "tid": 4183441, + "ts": 676007685606.765, "dur": 8138.287, + "args": { + "External id": 443395,"Record function id": 0, "Ev Idx": 5618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685745.441, "dur": 6.984, + "args": { + "External id": 443396,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685756.032, "dur": 0.943, + "args": { + "External id": 443397,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685758.548, "dur": 2.184, + "args": { + "External id": 443398,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685762.508, "dur": 0.684, + "args": { + "External id": 443399,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685765.036, "dur": 0.759, + "args": { + "External id": 443400,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685767.335, "dur": 1.151, + "args": { + "External id": 443401,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685770.287, "dur": 1.684, + "args": { + "External id": 443402,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685773.690, "dur": 1.816, + "args": { + "External id": 443403,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685777.101, "dur": 0.515, + "args": { + "External id": 443404,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007685779.581, "dur": 0.503, + "args": { + "External id": 443405,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007685801.045, "dur": 7906.281, + "args": { + "External id": 443406,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007685817.785, "dur": 7882.483, + "args": { + "External id": 443407,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007685835.311, "dur": 17.158, + "args": { + "External id": 443408,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007685855.356, "dur": 7777.129, + "args": { + "External id": 443409,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007685858.017, "dur": 7774.014, + "args": { + "External id": 443410,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007685864.665, "dur": 7.042, + "args": { + "External id": 443411,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007685873.582, "dur": 7755.490, + "args": { + "External id": 443412,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007693884.535, "dur": 40.822, + "args": { + "External id": 443413,"Sequence number": 5285409, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5636 + } + }, + { + "ph": "s", "id": 191, "pid": 4183441, "tid": 4183441, "ts": 676007693884.535, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007693913.167, "dur": 7.478, + "args": { + "External id": 443414,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007693916.550, "dur": 3.837, + "args": { + "External id": 443415,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007693989.365, "dur": 105.787, + "args": { + "External id": 443416,"Record function id": 0, "Ev Idx": 5639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007694098.084, "dur": 1130.000, + "args": { + "External id": 443417,"Record function id": 0, "Ev Idx": 5640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007694139.282, "dur": 1074.147, + "args": { + "External id": 443418,"Sequence number": 5285410, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5641 + } + }, + { + "ph": "s", "id": 190, "pid": 4183441, "tid": 4183441, "ts": 676007694139.282, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007694208.767, "dur": 43.100, + "args": { + "External id": 443419,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694264.371, "dur": 95.638, + "args": { + "External id": 443420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694370.137, "dur": 34.277, + "args": { + "External id": 443421,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694413.306, "dur": 28.364, + "args": { + "External id": 443422,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007694465.324, "dur": 26.766, + "args": { + "External id": 443423,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007694509.440, "dur": 15.313, + "args": { + "External id": 443424,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007694544.197, "dur": 183.286, + "args": { + "External id": 443425,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007694592.668, "dur": 11.680, + "args": { + "External id": 443426,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007694597.990, "dur": 5.423, + "args": { + "External id": 443427,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007694607.156, "dur": 5.393, + "args": { + "External id": 443428,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007694614.033, "dur": 1.157, + "args": { + "External id": 443429,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007694617.653, "dur": 3.922, + "args": { + "External id": 443430,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694741.189, "dur": 58.494, + "args": { + "External id": 443431,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007694831.595, "dur": 30.071, + "args": { + "External id": 443432,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694870.588, "dur": 38.045, + "args": { + "External id": 443433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007694917.628, "dur": 50.765, + "args": { + "External id": 443434,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007694991.065, "dur": 28.330, + "args": { + "External id": 443435,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007695024.484, "dur": 53.683, + "args": { + "External id": 443436,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007695115.342, "dur": 22.062, + "args": { + "External id": 443437,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5660 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.10)", "pid": 4183441, "tid": 4183441, + "ts": 676007695293.276, "dur": 80.469, + "args": { + "External id": 443438,"Record function id": 0, "Ev Idx": 5661 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007695446.601, "dur": 49.290, + "args": { + "External id": 443439,"Record function id": 0, "Ev Idx": 5662 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.11)", "pid": 4183441, "tid": 4183441, + "ts": 676007695505.486, "dur": 8926.069, + "args": { + "External id": 443440,"Record function id": 0, "Ev Idx": 5663 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 4183441, "tid": 4183441, + "ts": 676007695515.695, "dur": 991.703, + "args": { + "External id": 443441,"Record function id": 0, "Ev Idx": 5664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007695599.988, "dur": 8.901, + "args": { + "External id": 443442,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007695622.354, "dur": 85.024, + "args": { + "External id": 443443,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695628.318, "dur": 2.338, + "args": { + "External id": 443444,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695635.325, "dur": 0.266, + "args": { + "External id": 443445,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695637.409, "dur": 0.648, + "args": { + "External id": 443446,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695640.122, "dur": 0.303, + "args": { + "External id": 443447,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695644.228, "dur": 0.502, + "args": { + "External id": 443448,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695646.219, "dur": 0.595, + "args": { + "External id": 443449,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695648.325, "dur": 45.363, + "args": { + "External id": 443450,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695697.336, "dur": 0.506, + "args": { + "External id": 443451,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695699.976, "dur": 0.344, + "args": { + "External id": 443452,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007695724.719, "dur": 41.945, + "args": { + "External id": 443453,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007695801.958, "dur": 120.426, + "args": { + "External id": 443454,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007695812.936, "dur": 7.720, + "args": { + "External id": 443455,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007695826.349, "dur": 10.854, + "args": { + "External id": 443456,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007695831.097, "dur": 5.680, + "args": { + "External id": 443457,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695834.812, "dur": 0.656, + "args": { + "External id": 443458,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007695845.350, "dur": 32.448, + "args": { + "External id": 443459,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695847.724, "dur": 0.559, + "args": { + "External id": 443460,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695850.243, "dur": 2.561, + "args": { + "External id": 443461,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695854.830, "dur": 0.411, + "args": { + "External id": 443462,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695856.982, "dur": 1.907, + "args": { + "External id": 443463,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695863.259, "dur": 0.166, + "args": { + "External id": 443464,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695864.988, "dur": 0.516, + "args": { + "External id": 443465,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695867.035, "dur": 0.180, + "args": { + "External id": 443466,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695870.825, "dur": 0.404, + "args": { + "External id": 443467,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007695872.834, "dur": 0.158, + "args": { + "External id": 443468,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007695891.587, "dur": 22.936, + "args": { + "External id": 443469,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007695979.198, "dur": 428.648, + "args": { + "External id": 443470,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007696006.956, "dur": 395.039, + "args": { + "External id": 443471,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5694, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007696017.779, "dur": 378.271, + "args": { + "External id": 443472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007696431.072, "dur": 2.733, + "args": { + "External id": 443473,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5696, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 4183441, "tid": 4183441, + "ts": 676007696529.467, "dur": 7697.121, + "args": { + "External id": 443474,"Record function id": 0, "Ev Idx": 5697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696635.684, "dur": 6.371, + "args": { + "External id": 443475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696645.593, "dur": 1.443, + "args": { + "External id": 443476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696648.864, "dur": 40.028, + "args": { + "External id": 443477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696693.507, "dur": 1.266, + "args": { + "External id": 443478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696696.842, "dur": 1.355, + "args": { + "External id": 443479,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696699.961, "dur": 1.007, + "args": { + "External id": 443480,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696702.956, "dur": 0.953, + "args": { + "External id": 443481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696705.592, "dur": 2.928, + "args": { + "External id": 443482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696710.441, "dur": 0.777, + "args": { + "External id": 443483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007696712.995, "dur": 0.779, + "args": { + "External id": 443484,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007696735.265, "dur": 7452.431, + "args": { + "External id": 443485,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007696752.297, "dur": 7428.820, + "args": { + "External id": 443486,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007696774.738, "dur": 14.074, + "args": { + "External id": 443487,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007696791.481, "dur": 7356.638, + "args": { + "External id": 443488,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007696794.715, "dur": 7352.936, + "args": { + "External id": 443489,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007696801.391, "dur": 5.975, + "args": { + "External id": 443490,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007696809.119, "dur": 7335.725, + "args": { + "External id": 443491,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007704363.959, "dur": 43.325, + "args": { + "External id": 443492,"Sequence number": 5285411, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5715 + } + }, + { + "ph": "s", "id": 189, "pid": 4183441, "tid": 4183441, "ts": 676007704363.959, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007704394.287, "dur": 7.803, + "args": { + "External id": 443493,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007704397.646, "dur": 4.239, + "args": { + "External id": 443494,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007704471.534, "dur": 92.468, + "args": { + "External id": 443495,"Record function id": 0, "Ev Idx": 5718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007704565.896, "dur": 1081.516, + "args": { + "External id": 443496,"Record function id": 0, "Ev Idx": 5719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007704607.813, "dur": 1025.805, + "args": { + "External id": 443497,"Sequence number": 5285412, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5720 + } + }, + { + "ph": "s", "id": 188, "pid": 4183441, "tid": 4183441, "ts": 676007704607.813, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007704708.038, "dur": 45.722, + "args": { + "External id": 443498,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007704768.784, "dur": 94.514, + "args": { + "External id": 443499,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007704873.383, "dur": 35.993, + "args": { + "External id": 443500,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007704918.720, "dur": 28.897, + "args": { + "External id": 443501,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007704971.608, "dur": 25.516, + "args": { + "External id": 443502,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007705014.066, "dur": 16.755, + "args": { + "External id": 443503,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007705049.276, "dur": 154.106, + "args": { + "External id": 443504,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007705116.567, "dur": 13.927, + "args": { + "External id": 443505,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007705122.674, "dur": 6.644, + "args": { + "External id": 443506,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007705133.380, "dur": 5.665, + "args": { + "External id": 443507,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007705140.376, "dur": 1.102, + "args": { + "External id": 443508,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007705143.992, "dur": 4.217, + "args": { + "External id": 443509,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007705214.545, "dur": 48.801, + "args": { + "External id": 443510,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007705293.983, "dur": 30.252, + "args": { + "External id": 443511,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007705333.044, "dur": 38.334, + "args": { + "External id": 443512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007705380.241, "dur": 30.973, + "args": { + "External id": 443513,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007705433.191, "dur": 30.833, + "args": { + "External id": 443514,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007705469.929, "dur": 45.815, + "args": { + "External id": 443515,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007705534.613, "dur": 20.036, + "args": { + "External id": 443516,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5739 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.11)", "pid": 4183441, "tid": 4183441, + "ts": 676007705751.656, "dur": 81.777, + "args": { + "External id": 443517,"Record function id": 0, "Ev Idx": 5740 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007705908.188, "dur": 46.870, + "args": { + "External id": 443518,"Record function id": 0, "Ev Idx": 5741 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.12)", "pid": 4183441, "tid": 4183441, + "ts": 676007705965.604, "dur": 9052.240, + "args": { + "External id": 443519,"Record function id": 0, "Ev Idx": 5742 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 4183441, "tid": 4183441, + "ts": 676007705975.668, "dur": 933.648, + "args": { + "External id": 443520,"Record function id": 0, "Ev Idx": 5743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007706058.359, "dur": 9.675, + "args": { + "External id": 443521,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007706099.508, "dur": 42.412, + "args": { + "External id": 443522,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706105.660, "dur": 2.280, + "args": { + "External id": 443523,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706112.987, "dur": 0.455, + "args": { + "External id": 443524,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706115.058, "dur": 0.384, + "args": { + "External id": 443525,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706117.309, "dur": 2.530, + "args": { + "External id": 443526,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706121.389, "dur": 0.207, + "args": { + "External id": 443527,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706123.459, "dur": 0.396, + "args": { + "External id": 443528,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706127.782, "dur": 2.113, + "args": { + "External id": 443529,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706131.962, "dur": 0.304, + "args": { + "External id": 443530,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706133.907, "dur": 0.484, + "args": { + "External id": 443531,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007706154.317, "dur": 44.410, + "args": { + "External id": 443532,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007706234.566, "dur": 121.754, + "args": { + "External id": 443533,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007706245.779, "dur": 5.217, + "args": { + "External id": 443534,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007706256.642, "dur": 13.134, + "args": { + "External id": 443535,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007706260.995, "dur": 8.343, + "args": { + "External id": 443536,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706264.838, "dur": 3.217, + "args": { + "External id": 443537,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007706277.532, "dur": 33.916, + "args": { + "External id": 443538,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706280.953, "dur": 0.539, + "args": { + "External id": 443539,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706283.090, "dur": 0.791, + "args": { + "External id": 443540,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706285.824, "dur": 0.601, + "args": { + "External id": 443541,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706290.116, "dur": 1.788, + "args": { + "External id": 443542,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706293.312, "dur": 0.444, + "args": { + "External id": 443543,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706295.225, "dur": 2.724, + "args": { + "External id": 443544,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706299.889, "dur": 0.575, + "args": { + "External id": 443545,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706302.183, "dur": 0.229, + "args": { + "External id": 443546,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007706306.723, "dur": 0.371, + "args": { + "External id": 443547,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007706324.362, "dur": 23.678, + "args": { + "External id": 443548,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007706409.985, "dur": 405.123, + "args": { + "External id": 443549,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007706437.570, "dur": 372.178, + "args": { + "External id": 443550,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5773, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007706448.508, "dur": 355.619, + "args": { + "External id": 443551,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007706838.025, "dur": 2.306, + "args": { + "External id": 443552,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5775, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 4183441, "tid": 4183441, + "ts": 676007706930.437, "dur": 7883.633, + "args": { + "External id": 443553,"Record function id": 0, "Ev Idx": 5776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707033.202, "dur": 6.385, + "args": { + "External id": 443554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707042.729, "dur": 1.018, + "args": { + "External id": 443555,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707045.201, "dur": 2.585, + "args": { + "External id": 443556,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707049.446, "dur": 0.887, + "args": { + "External id": 443557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707051.770, "dur": 1.105, + "args": { + "External id": 443558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707054.478, "dur": 1.146, + "args": { + "External id": 443559,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707057.419, "dur": 1.345, + "args": { + "External id": 443560,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707060.702, "dur": 1.957, + "args": { + "External id": 443561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707064.582, "dur": 0.869, + "args": { + "External id": 443562,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007707067.273, "dur": 0.791, + "args": { + "External id": 443563,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007707104.500, "dur": 7672.023, + "args": { + "External id": 443564,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007707120.408, "dur": 7648.997, + "args": { + "External id": 443565,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007707141.876, "dur": 15.555, + "args": { + "External id": 443566,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007707160.431, "dur": 7575.964, + "args": { + "External id": 443567,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007707163.056, "dur": 7572.793, + "args": { + "External id": 443568,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007707169.219, "dur": 7.460, + "args": { + "External id": 443569,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007707178.452, "dur": 7554.296, + "args": { + "External id": 443570,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007714952.260, "dur": 41.854, + "args": { + "External id": 443571,"Sequence number": 5285413, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5794 + } + }, + { + "ph": "s", "id": 187, "pid": 4183441, "tid": 4183441, "ts": 676007714952.260, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007714980.777, "dur": 8.141, + "args": { + "External id": 443572,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007714984.108, "dur": 4.553, + "args": { + "External id": 443573,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007715058.271, "dur": 107.969, + "args": { + "External id": 443574,"Record function id": 0, "Ev Idx": 5797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007715169.175, "dur": 1114.712, + "args": { + "External id": 443575,"Record function id": 0, "Ev Idx": 5798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007715212.865, "dur": 1055.857, + "args": { + "External id": 443576,"Sequence number": 5285414, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5799 + } + }, + { + "ph": "s", "id": 186, "pid": 4183441, "tid": 4183441, "ts": 676007715212.865, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007715279.676, "dur": 45.061, + "args": { + "External id": 443577,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715337.170, "dur": 93.961, + "args": { + "External id": 443578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715441.146, "dur": 35.920, + "args": { + "External id": 443579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715485.488, "dur": 29.723, + "args": { + "External id": 443580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007715538.783, "dur": 29.381, + "args": { + "External id": 443581,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007715585.364, "dur": 15.771, + "args": { + "External id": 443582,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007715621.483, "dur": 179.614, + "args": { + "External id": 443583,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007715715.994, "dur": 13.327, + "args": { + "External id": 443584,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007715721.481, "dur": 6.811, + "args": { + "External id": 443585,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007715732.328, "dur": 5.618, + "args": { + "External id": 443586,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007715739.279, "dur": 1.186, + "args": { + "External id": 443587,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007715742.760, "dur": 3.800, + "args": { + "External id": 443588,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715811.748, "dur": 53.031, + "args": { + "External id": 443589,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007715895.719, "dur": 31.704, + "args": { + "External id": 443590,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715934.992, "dur": 37.768, + "args": { + "External id": 443591,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007715981.913, "dur": 38.378, + "args": { + "External id": 443592,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007716051.223, "dur": 44.427, + "args": { + "External id": 443593,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007716107.120, "dur": 53.830, + "args": { + "External id": 443594,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007716180.088, "dur": 20.059, + "args": { + "External id": 443595,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5818 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.12)", "pid": 4183441, "tid": 4183441, + "ts": 676007716351.147, "dur": 83.147, + "args": { + "External id": 443596,"Record function id": 0, "Ev Idx": 5819 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007716505.980, "dur": 46.235, + "args": { + "External id": 443597,"Record function id": 0, "Ev Idx": 5820 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.13)", "pid": 4183441, "tid": 4183441, + "ts": 676007716561.192, "dur": 9073.175, + "args": { + "External id": 443598,"Record function id": 0, "Ev Idx": 5821 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 4183441, "tid": 4183441, + "ts": 676007716570.555, "dur": 917.692, + "args": { + "External id": 443599,"Record function id": 0, "Ev Idx": 5822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007716692.887, "dur": 10.620, + "args": { + "External id": 443600,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007716717.929, "dur": 38.178, + "args": { + "External id": 443601,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716723.494, "dur": 2.569, + "args": { + "External id": 443602,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716731.087, "dur": 0.591, + "args": { + "External id": 443603,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716732.725, "dur": 0.745, + "args": { + "External id": 443604,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716734.840, "dur": 1.031, + "args": { + "External id": 443605,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716738.914, "dur": 0.963, + "args": { + "External id": 443606,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716741.127, "dur": 0.736, + "args": { + "External id": 443607,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716742.729, "dur": 2.540, + "args": { + "External id": 443608,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716747.022, "dur": 0.762, + "args": { + "External id": 443609,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716748.848, "dur": 0.547, + "args": { + "External id": 443610,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007716769.355, "dur": 42.747, + "args": { + "External id": 443611,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007716845.342, "dur": 116.022, + "args": { + "External id": 443612,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007716856.514, "dur": 5.281, + "args": { + "External id": 443613,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007716867.353, "dur": 10.602, + "args": { + "External id": 443614,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007716871.978, "dur": 5.567, + "args": { + "External id": 443615,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716875.197, "dur": 0.824, + "args": { + "External id": 443616,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007716885.083, "dur": 31.703, + "args": { + "External id": 443617,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716887.001, "dur": 3.101, + "args": { + "External id": 443618,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716891.317, "dur": 0.637, + "args": { + "External id": 443619,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716893.273, "dur": 0.682, + "args": { + "External id": 443620,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716897.010, "dur": 0.407, + "args": { + "External id": 443621,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716898.861, "dur": 0.664, + "args": { + "External id": 443622,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716900.700, "dur": 0.837, + "args": { + "External id": 443623,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716905.021, "dur": 0.637, + "args": { + "External id": 443624,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716906.622, "dur": 0.626, + "args": { + "External id": 443625,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007716908.446, "dur": 2.467, + "args": { + "External id": 443626,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007716929.713, "dur": 24.191, + "args": { + "External id": 443627,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007717015.840, "dur": 379.625, + "args": { + "External id": 443628,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007717041.653, "dur": 348.266, + "args": { + "External id": 443629,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5852, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007717052.432, "dur": 331.159, + "args": { + "External id": 443630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007717417.062, "dur": 2.457, + "args": { + "External id": 443631,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5854, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 4183441, "tid": 4183441, + "ts": 676007717509.624, "dur": 7917.116, + "args": { + "External id": 443632,"Record function id": 0, "Ev Idx": 5855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717607.524, "dur": 6.189, + "args": { + "External id": 443633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717617.228, "dur": 1.602, + "args": { + "External id": 443634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717620.543, "dur": 0.963, + "args": { + "External id": 443635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717623.123, "dur": 1.561, + "args": { + "External id": 443636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717626.471, "dur": 1.615, + "args": { + "External id": 443637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717629.798, "dur": 1.044, + "args": { + "External id": 443638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717633.032, "dur": 1.523, + "args": { + "External id": 443639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717636.511, "dur": 2.882, + "args": { + "External id": 443640,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717641.185, "dur": 1.336, + "args": { + "External id": 443641,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007717644.627, "dur": 1.084, + "args": { + "External id": 443642,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007717702.088, "dur": 7684.358, + "args": { + "External id": 443643,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007717718.500, "dur": 7661.065, + "args": { + "External id": 443644,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007717739.042, "dur": 15.038, + "args": { + "External id": 443645,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007717756.990, "dur": 7590.291, + "args": { + "External id": 443646,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007717759.735, "dur": 7587.052, + "args": { + "External id": 443647,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007717765.657, "dur": 8.071, + "args": { + "External id": 443648,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007717775.583, "dur": 7568.064, + "args": { + "External id": 443649,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007725579.334, "dur": 29.884, + "args": { + "External id": 443650,"Sequence number": 5285415, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5873 + } + }, + { + "ph": "s", "id": 185, "pid": 4183441, "tid": 4183441, "ts": 676007725579.334, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007725596.105, "dur": 8.410, + "args": { + "External id": 443651,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007725599.499, "dur": 4.834, + "args": { + "External id": 443652,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007725700.753, "dur": 93.837, + "args": { + "External id": 443653,"Record function id": 0, "Ev Idx": 5876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007725797.296, "dur": 1531.859, + "args": { + "External id": 443654,"Record function id": 0, "Ev Idx": 5877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007725840.723, "dur": 1472.731, + "args": { + "External id": 443655,"Sequence number": 5285416, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5878 + } + }, + { + "ph": "s", "id": 184, "pid": 4183441, "tid": 4183441, "ts": 676007725840.723, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007725911.670, "dur": 44.242, + "args": { + "External id": 443656,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007725969.312, "dur": 92.576, + "args": { + "External id": 443657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007726070.817, "dur": 422.177, + "args": { + "External id": 443658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007726516.484, "dur": 39.214, + "args": { + "External id": 443659,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007726586.039, "dur": 28.928, + "args": { + "External id": 443660,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007726632.722, "dur": 15.288, + "args": { + "External id": 443661,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007726706.455, "dur": 145.724, + "args": { + "External id": 443662,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007726762.075, "dur": 14.177, + "args": { + "External id": 443663,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007726768.045, "dur": 7.111, + "args": { + "External id": 443664,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007726778.974, "dur": 6.185, + "args": { + "External id": 443665,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007726786.514, "dur": 1.860, + "args": { + "External id": 443666,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007726790.545, "dur": 3.001, + "args": { + "External id": 443667,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007726863.449, "dur": 64.303, + "args": { + "External id": 443668,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007726959.756, "dur": 30.151, + "args": { + "External id": 443669,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007726997.830, "dur": 42.047, + "args": { + "External id": 443670,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007727048.340, "dur": 31.829, + "args": { + "External id": 443671,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007727119.219, "dur": 26.354, + "args": { + "External id": 443672,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007727152.412, "dur": 44.832, + "args": { + "External id": 443673,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007727219.055, "dur": 16.709, + "args": { + "External id": 443674,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5897 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.13)", "pid": 4183441, "tid": 4183441, + "ts": 676007727398.874, "dur": 84.765, + "args": { + "External id": 443675,"Record function id": 0, "Ev Idx": 5898 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007727555.862, "dur": 50.852, + "args": { + "External id": 443676,"Record function id": 0, "Ev Idx": 5899 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.14)", "pid": 4183441, "tid": 4183441, + "ts": 676007727615.518, "dur": 9145.164, + "args": { + "External id": 443677,"Record function id": 0, "Ev Idx": 5900 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 4183441, "tid": 4183441, + "ts": 676007727625.408, "dur": 934.892, + "args": { + "External id": 443678,"Record function id": 0, "Ev Idx": 5901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007727754.454, "dur": 10.263, + "args": { + "External id": 443679,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007727779.015, "dur": 47.296, + "args": { + "External id": 443680,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727789.084, "dur": 2.715, + "args": { + "External id": 443681,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727796.178, "dur": 0.777, + "args": { + "External id": 443682,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727798.031, "dur": 0.822, + "args": { + "External id": 443683,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727800.324, "dur": 2.519, + "args": { + "External id": 443684,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727804.320, "dur": 0.750, + "args": { + "External id": 443685,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727808.395, "dur": 0.686, + "args": { + "External id": 443686,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727812.188, "dur": 0.472, + "args": { + "External id": 443687,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727813.891, "dur": 0.696, + "args": { + "External id": 443688,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727815.606, "dur": 2.639, + "args": { + "External id": 443689,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007727838.225, "dur": 42.767, + "args": { + "External id": 443690,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007727914.632, "dur": 109.836, + "args": { + "External id": 443691,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007727924.587, "dur": 4.351, + "args": { + "External id": 443692,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007727934.498, "dur": 10.773, + "args": { + "External id": 443693,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007727939.013, "dur": 5.847, + "args": { + "External id": 443694,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727942.590, "dur": 1.063, + "args": { + "External id": 443695,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007727951.385, "dur": 29.059, + "args": { + "External id": 443696,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727953.317, "dur": 0.434, + "args": { + "External id": 443697,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727955.447, "dur": 0.905, + "args": { + "External id": 443698,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727957.435, "dur": 2.385, + "args": { + "External id": 443699,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727961.250, "dur": 0.763, + "args": { + "External id": 443700,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727963.026, "dur": 0.491, + "args": { + "External id": 443701,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727966.723, "dur": 0.421, + "args": { + "External id": 443702,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727968.105, "dur": 0.443, + "args": { + "External id": 443703,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727969.983, "dur": 0.970, + "args": { + "External id": 443704,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007727974.217, "dur": 0.542, + "args": { + "External id": 443705,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007727992.237, "dur": 23.418, + "args": { + "External id": 443706,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007728080.635, "dur": 386.426, + "args": { + "External id": 443707,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 5930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007728126.769, "dur": 335.078, + "args": { + "External id": 443708,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5931, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007728137.808, "dur": 318.830, + "args": { + "External id": 443709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 5932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007728486.156, "dur": 2.476, + "args": { + "External id": 443710,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5933, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 4183441, "tid": 4183441, + "ts": 676007728580.941, "dur": 7938.795, + "args": { + "External id": 443711,"Record function id": 0, "Ev Idx": 5934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728722.955, "dur": 7.013, + "args": { + "External id": 443712,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 5935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728733.819, "dur": 1.338, + "args": { + "External id": 443713,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728736.815, "dur": 1.372, + "args": { + "External id": 443714,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728739.673, "dur": 1.127, + "args": { + "External id": 443715,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728742.603, "dur": 1.229, + "args": { + "External id": 443716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728745.820, "dur": 0.984, + "args": { + "External id": 443717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 5940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728748.915, "dur": 0.876, + "args": { + "External id": 443718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 5941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728751.532, "dur": 2.880, + "args": { + "External id": 443719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728756.420, "dur": 1.028, + "args": { + "External id": 443720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007728759.099, "dur": 1.132, + "args": { + "External id": 443721,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 5944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007728780.592, "dur": 7700.896, + "args": { + "External id": 443722,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007728796.480, "dur": 7678.301, + "args": { + "External id": 443723,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 5946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007728813.469, "dur": 14.520, + "args": { + "External id": 443724,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007728830.474, "dur": 7612.322, + "args": { + "External id": 443725,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 5948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007728833.502, "dur": 7608.860, + "args": { + "External id": 443726,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 5949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007728838.879, "dur": 7.390, + "args": { + "External id": 443727,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007728848.565, "dur": 7590.985, + "args": { + "External id": 443728,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 5951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007736700.947, "dur": 30.901, + "args": { + "External id": 443729,"Sequence number": 5285417, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 5952 + } + }, + { + "ph": "s", "id": 183, "pid": 4183441, "tid": 4183441, "ts": 676007736700.947, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007736718.282, "dur": 8.606, + "args": { + "External id": 443730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 5953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007736721.659, "dur": 4.878, + "args": { + "External id": 443731,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 5954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007736801.138, "dur": 94.009, + "args": { + "External id": 443732,"Record function id": 0, "Ev Idx": 5955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007736896.743, "dur": 1082.296, + "args": { + "External id": 443733,"Record function id": 0, "Ev Idx": 5956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007736939.004, "dur": 1024.987, + "args": { + "External id": 443734,"Sequence number": 5285418, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 5957 + } + }, + { + "ph": "s", "id": 182, "pid": 4183441, "tid": 4183441, "ts": 676007736939.004, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007737006.286, "dur": 42.263, + "args": { + "External id": 443735,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737061.455, "dur": 107.603, + "args": { + "External id": 443736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737181.767, "dur": 35.242, + "args": { + "External id": 443737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737226.641, "dur": 29.805, + "args": { + "External id": 443738,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007737282.341, "dur": 26.790, + "args": { + "External id": 443739,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007737327.517, "dur": 13.853, + "args": { + "External id": 443740,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007737359.818, "dur": 132.558, + "args": { + "External id": 443741,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 5964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007737414.559, "dur": 12.013, + "args": { + "External id": 443742,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 5965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007737419.601, "dur": 6.140, + "args": { + "External id": 443743,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007737429.200, "dur": 6.469, + "args": { + "External id": 443744,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007737436.809, "dur": 1.473, + "args": { + "External id": 443745,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007737440.695, "dur": 3.166, + "args": { + "External id": 443746,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737503.546, "dur": 43.915, + "args": { + "External id": 443747,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 5970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007737577.860, "dur": 29.842, + "args": { + "External id": 443748,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 5971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737615.602, "dur": 73.181, + "args": { + "External id": 443749,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737702.137, "dur": 37.118, + "args": { + "External id": 443750,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 5973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007737763.567, "dur": 27.232, + "args": { + "External id": 443751,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 5974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007737797.097, "dur": 53.209, + "args": { + "External id": 443752,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 5975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007737871.965, "dur": 20.957, + "args": { + "External id": 443753,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 5976 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.14)", "pid": 4183441, "tid": 4183441, + "ts": 676007738042.392, "dur": 105.960, + "args": { + "External id": 443754,"Record function id": 0, "Ev Idx": 5977 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007738224.789, "dur": 52.324, + "args": { + "External id": 443755,"Record function id": 0, "Ev Idx": 5978 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.15)", "pid": 4183441, "tid": 4183441, + "ts": 676007738287.735, "dur": 9452.988, + "args": { + "External id": 443756,"Record function id": 0, "Ev Idx": 5979 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 4183441, "tid": 4183441, + "ts": 676007738296.219, "dur": 973.341, + "args": { + "External id": 443757,"Record function id": 0, "Ev Idx": 5980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007738385.302, "dur": 9.893, + "args": { + "External id": 443758,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007738408.329, "dur": 37.177, + "args": { + "External id": 443759,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738414.512, "dur": 2.226, + "args": { + "External id": 443760,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738421.007, "dur": 0.533, + "args": { + "External id": 443761,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738422.818, "dur": 0.800, + "args": { + "External id": 443762,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738424.557, "dur": 0.623, + "args": { + "External id": 443763,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738429.105, "dur": 0.429, + "args": { + "External id": 443764,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738430.636, "dur": 0.668, + "args": { + "External id": 443765,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738433.017, "dur": 2.213, + "args": { + "External id": 443766,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738436.191, "dur": 0.412, + "args": { + "External id": 443767,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738437.678, "dur": 0.426, + "args": { + "External id": 443768,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007738460.714, "dur": 46.005, + "args": { + "External id": 443769,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 5992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007738540.715, "dur": 180.961, + "args": { + "External id": 443770,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 5993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007738553.339, "dur": 5.440, + "args": { + "External id": 443771,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007738564.250, "dur": 11.198, + "args": { + "External id": 443772,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007738569.303, "dur": 5.785, + "args": { + "External id": 443773,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 5996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738572.723, "dur": 1.085, + "args": { + "External id": 443774,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 5997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007738582.294, "dur": 32.726, + "args": { + "External id": 443775,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 5998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738584.947, "dur": 2.961, + "args": { + "External id": 443776,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 5999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738589.322, "dur": 0.888, + "args": { + "External id": 443777,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738591.681, "dur": 0.813, + "args": { + "External id": 443778,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738595.740, "dur": 0.548, + "args": { + "External id": 443779,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738597.748, "dur": 0.539, + "args": { + "External id": 443780,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738599.267, "dur": 0.576, + "args": { + "External id": 443781,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738603.328, "dur": 0.624, + "args": { + "External id": 443782,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738605.697, "dur": 0.450, + "args": { + "External id": 443783,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007738607.296, "dur": 2.610, + "args": { + "External id": 443784,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007738638.762, "dur": 66.859, + "args": { + "External id": 443785,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007738781.466, "dur": 393.469, + "args": { + "External id": 443786,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007738808.710, "dur": 360.636, + "args": { + "External id": 443787,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6010, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007738821.623, "dur": 341.711, + "args": { + "External id": 443788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007739197.250, "dur": 2.489, + "args": { + "External id": 443789,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6012, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 4183441, "tid": 4183441, + "ts": 676007739290.121, "dur": 8213.189, + "args": { + "External id": 443790,"Record function id": 0, "Ev Idx": 6013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739395.003, "dur": 7.192, + "args": { + "External id": 443791,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739405.568, "dur": 1.605, + "args": { + "External id": 443792,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739408.803, "dur": 1.358, + "args": { + "External id": 443793,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739411.652, "dur": 0.866, + "args": { + "External id": 443794,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739414.268, "dur": 1.370, + "args": { + "External id": 443795,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739417.941, "dur": 1.147, + "args": { + "External id": 443796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739421.488, "dur": 1.208, + "args": { + "External id": 443797,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739424.670, "dur": 2.585, + "args": { + "External id": 443798,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739428.845, "dur": 0.967, + "args": { + "External id": 443799,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007739431.488, "dur": 1.146, + "args": { + "External id": 443800,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007739450.887, "dur": 8013.977, + "args": { + "External id": 443801,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007739466.021, "dur": 7991.727, + "args": { + "External id": 443802,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007739481.450, "dur": 14.426, + "args": { + "External id": 443803,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007739499.383, "dur": 7925.405, + "args": { + "External id": 443804,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007739501.965, "dur": 7922.372, + "args": { + "External id": 443805,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007739508.534, "dur": 8.115, + "args": { + "External id": 443806,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007739518.550, "dur": 7903.143, + "args": { + "External id": 443807,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007747680.584, "dur": 33.946, + "args": { + "External id": 443808,"Sequence number": 5285419, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6031 + } + }, + { + "ph": "s", "id": 181, "pid": 4183441, "tid": 4183441, "ts": 676007747680.584, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007747699.911, "dur": 9.453, + "args": { + "External id": 443809,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007747703.477, "dur": 5.574, + "args": { + "External id": 443810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007747779.919, "dur": 92.445, + "args": { + "External id": 443811,"Record function id": 0, "Ev Idx": 6034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007747873.991, "dur": 1137.946, + "args": { + "External id": 443812,"Record function id": 0, "Ev Idx": 6035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007747917.129, "dur": 1079.890, + "args": { + "External id": 443813,"Sequence number": 5285420, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6036 + } + }, + { + "ph": "s", "id": 180, "pid": 4183441, "tid": 4183441, "ts": 676007747917.129, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007747986.619, "dur": 42.914, + "args": { + "External id": 443814,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748042.824, "dur": 112.532, + "args": { + "External id": 443815,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748167.525, "dur": 37.511, + "args": { + "External id": 443816,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748214.283, "dur": 30.476, + "args": { + "External id": 443817,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007748271.022, "dur": 26.226, + "args": { + "External id": 443818,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007748314.944, "dur": 14.784, + "args": { + "External id": 443819,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007748347.923, "dur": 136.628, + "args": { + "External id": 443820,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007748399.863, "dur": 12.791, + "args": { + "External id": 443821,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007748405.289, "dur": 6.407, + "args": { + "External id": 443822,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007748415.345, "dur": 6.229, + "args": { + "External id": 443823,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007748422.899, "dur": 1.666, + "args": { + "External id": 443824,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007748426.930, "dur": 2.635, + "args": { + "External id": 443825,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748508.552, "dur": 52.479, + "args": { + "External id": 443826,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007748594.907, "dur": 31.874, + "args": { + "External id": 443827,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748634.938, "dur": 79.199, + "args": { + "External id": 443828,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748727.756, "dur": 51.268, + "args": { + "External id": 443829,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007748802.551, "dur": 26.496, + "args": { + "External id": 443830,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007748835.207, "dur": 46.286, + "args": { + "External id": 443831,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007748901.985, "dur": 16.985, + "args": { + "External id": 443832,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6055 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.15)", "pid": 4183441, "tid": 4183441, + "ts": 676007749075.925, "dur": 100.546, + "args": { + "External id": 443833,"Record function id": 0, "Ev Idx": 6056 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007749254.288, "dur": 47.971, + "args": { + "External id": 443834,"Record function id": 0, "Ev Idx": 6057 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.16)", "pid": 4183441, "tid": 4183441, + "ts": 676007749311.013, "dur": 9478.470, + "args": { + "External id": 443835,"Record function id": 0, "Ev Idx": 6058 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 4183441, "tid": 4183441, + "ts": 676007749319.610, "dur": 985.061, + "args": { + "External id": 443836,"Record function id": 0, "Ev Idx": 6059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007749405.419, "dur": 8.967, + "args": { + "External id": 443837,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007749426.769, "dur": 37.586, + "args": { + "External id": 443838,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749432.032, "dur": 2.543, + "args": { + "External id": 443839,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749438.653, "dur": 0.732, + "args": { + "External id": 443840,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749440.698, "dur": 0.461, + "args": { + "External id": 443841,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749442.982, "dur": 0.732, + "args": { + "External id": 443842,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749447.372, "dur": 0.526, + "args": { + "External id": 443843,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749449.291, "dur": 1.003, + "args": { + "External id": 443844,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749451.385, "dur": 2.357, + "args": { + "External id": 443845,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749455.208, "dur": 0.402, + "args": { + "External id": 443846,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749456.572, "dur": 0.494, + "args": { + "External id": 443847,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007749479.619, "dur": 41.900, + "args": { + "External id": 443848,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007749554.465, "dur": 152.172, + "args": { + "External id": 443849,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007749564.844, "dur": 5.794, + "args": { + "External id": 443850,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007749576.479, "dur": 10.265, + "args": { + "External id": 443851,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007749580.994, "dur": 5.328, + "args": { + "External id": 443852,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749584.304, "dur": 0.833, + "args": { + "External id": 443853,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007749592.597, "dur": 30.053, + "args": { + "External id": 443854,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749594.676, "dur": 0.605, + "args": { + "External id": 443855,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749596.700, "dur": 2.880, + "args": { + "External id": 443856,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749600.642, "dur": 0.791, + "args": { + "External id": 443857,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749602.932, "dur": 0.697, + "args": { + "External id": 443858,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749606.616, "dur": 0.793, + "args": { + "External id": 443859,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749608.829, "dur": 0.883, + "args": { + "External id": 443860,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749610.696, "dur": 0.658, + "args": { + "External id": 443861,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749614.305, "dur": 0.740, + "args": { + "External id": 443862,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007749616.052, "dur": 0.909, + "args": { + "External id": 443863,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007749632.768, "dur": 63.836, + "args": { + "External id": 443864,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007749763.400, "dur": 442.708, + "args": { + "External id": 443865,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007749791.379, "dur": 408.868, + "args": { + "External id": 443866,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6089, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007749802.128, "dur": 389.606, + "args": { + "External id": 443867,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007750228.964, "dur": 2.419, + "args": { + "External id": 443868,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6091, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 4183441, "tid": 4183441, + "ts": 676007750324.874, "dur": 8221.404, + "args": { + "External id": 443869,"Record function id": 0, "Ev Idx": 6092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750428.069, "dur": 6.799, + "args": { + "External id": 443870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750438.308, "dur": 1.515, + "args": { + "External id": 443871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750441.684, "dur": 1.619, + "args": { + "External id": 443872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750445.175, "dur": 1.790, + "args": { + "External id": 443873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750448.463, "dur": 1.569, + "args": { + "External id": 443874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750451.699, "dur": 0.999, + "args": { + "External id": 443875,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750454.643, "dur": 1.395, + "args": { + "External id": 443876,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750457.903, "dur": 2.927, + "args": { + "External id": 443877,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750462.452, "dur": 1.102, + "args": { + "External id": 443878,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007750465.408, "dur": 1.258, + "args": { + "External id": 443879,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007750484.968, "dur": 8024.975, + "args": { + "External id": 443880,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007750500.689, "dur": 8002.592, + "args": { + "External id": 443881,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007750516.032, "dur": 14.551, + "args": { + "External id": 443882,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007750533.377, "dur": 7938.553, + "args": { + "External id": 443883,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007750535.856, "dur": 7935.601, + "args": { + "External id": 443884,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007750542.684, "dur": 7.178, + "args": { + "External id": 443885,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007750551.694, "dur": 7916.800, + "args": { + "External id": 443886,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007758731.859, "dur": 31.200, + "args": { + "External id": 443887,"Sequence number": 5285421, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6110 + } + }, + { + "ph": "s", "id": 179, "pid": 4183441, "tid": 4183441, "ts": 676007758731.859, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007758749.002, "dur": 8.803, + "args": { + "External id": 443888,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007758752.312, "dur": 5.035, + "args": { + "External id": 443889,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007758829.247, "dur": 93.008, + "args": { + "External id": 443890,"Record function id": 0, "Ev Idx": 6113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007758924.032, "dur": 1126.240, + "args": { + "External id": 443891,"Record function id": 0, "Ev Idx": 6114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007758963.039, "dur": 1072.451, + "args": { + "External id": 443892,"Sequence number": 5285422, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6115 + } + }, + { + "ph": "s", "id": 178, "pid": 4183441, "tid": 4183441, "ts": 676007758963.039, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007759031.451, "dur": 44.961, + "args": { + "External id": 443893,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759107.285, "dur": 93.524, + "args": { + "External id": 443894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759211.322, "dur": 34.510, + "args": { + "External id": 443895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759254.942, "dur": 29.024, + "args": { + "External id": 443896,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007759315.135, "dur": 28.448, + "args": { + "External id": 443897,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007759359.060, "dur": 14.555, + "args": { + "External id": 443898,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007759391.145, "dur": 137.374, + "args": { + "External id": 443899,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007759446.725, "dur": 11.920, + "args": { + "External id": 443900,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007759452.290, "dur": 5.414, + "args": { + "External id": 443901,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007759461.411, "dur": 6.213, + "args": { + "External id": 443902,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007759469.021, "dur": 1.919, + "args": { + "External id": 443903,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007759473.260, "dur": 5.191, + "args": { + "External id": 443904,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759558.584, "dur": 55.359, + "args": { + "External id": 443905,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007759648.019, "dur": 68.831, + "args": { + "External id": 443906,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759728.863, "dur": 42.150, + "args": { + "External id": 443907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759779.655, "dur": 47.541, + "args": { + "External id": 443908,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007759850.226, "dur": 24.138, + "args": { + "External id": 443909,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007759879.926, "dur": 45.958, + "args": { + "External id": 443910,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007759946.374, "dur": 18.158, + "args": { + "External id": 443911,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6134 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.16)", "pid": 4183441, "tid": 4183441, + "ts": 676007760130.565, "dur": 83.712, + "args": { + "External id": 443912,"Record function id": 0, "Ev Idx": 6135 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007760290.273, "dur": 47.807, + "args": { + "External id": 443913,"Record function id": 0, "Ev Idx": 6136 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.17)", "pid": 4183441, "tid": 4183441, + "ts": 676007760347.407, "dur": 9348.329, + "args": { + "External id": 443914,"Record function id": 0, "Ev Idx": 6137 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 4183441, "tid": 4183441, + "ts": 676007760356.191, "dur": 935.063, + "args": { + "External id": 443915,"Record function id": 0, "Ev Idx": 6138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007760440.983, "dur": 9.250, + "args": { + "External id": 443916,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007760463.555, "dur": 37.921, + "args": { + "External id": 443917,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760469.026, "dur": 2.551, + "args": { + "External id": 443918,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760475.880, "dur": 0.658, + "args": { + "External id": 443919,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760478.024, "dur": 0.591, + "args": { + "External id": 443920,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760480.240, "dur": 0.677, + "args": { + "External id": 443921,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760484.305, "dur": 0.677, + "args": { + "External id": 443922,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760486.416, "dur": 0.535, + "args": { + "External id": 443923,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760487.902, "dur": 2.365, + "args": { + "External id": 443924,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760491.905, "dur": 0.380, + "args": { + "External id": 443925,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760493.464, "dur": 0.498, + "args": { + "External id": 443926,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007760513.883, "dur": 41.840, + "args": { + "External id": 443927,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007760588.938, "dur": 156.871, + "args": { + "External id": 443928,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007760599.251, "dur": 4.571, + "args": { + "External id": 443929,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007760609.550, "dur": 10.964, + "args": { + "External id": 443930,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007760614.179, "dur": 5.950, + "args": { + "External id": 443931,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760617.919, "dur": 0.904, + "args": { + "External id": 443932,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007760626.783, "dur": 67.996, + "args": { + "External id": 443933,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760628.643, "dur": 2.273, + "args": { + "External id": 443934,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760632.421, "dur": 0.630, + "args": { + "External id": 443935,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760634.256, "dur": 1.066, + "args": { + "External id": 443936,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760638.681, "dur": 0.404, + "args": { + "External id": 443937,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760640.365, "dur": 0.530, + "args": { + "External id": 443938,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760643.099, "dur": 0.629, + "args": { + "External id": 443939,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760646.469, "dur": 0.550, + "args": { + "External id": 443940,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760648.035, "dur": 0.417, + "args": { + "External id": 443941,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007760649.774, "dur": 38.952, + "args": { + "External id": 443942,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007760711.359, "dur": 26.176, + "args": { + "External id": 443943,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007760801.655, "dur": 394.322, + "args": { + "External id": 443944,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007760827.728, "dur": 363.268, + "args": { + "External id": 443945,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6168, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007760838.765, "dur": 343.679, + "args": { + "External id": 443946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007761217.822, "dur": 2.334, + "args": { + "External id": 443947,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6170, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 4183441, "tid": 4183441, + "ts": 676007761313.784, "dur": 8142.969, + "args": { + "External id": 443948,"Record function id": 0, "Ev Idx": 6171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761414.909, "dur": 6.617, + "args": { + "External id": 443949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761425.051, "dur": 1.396, + "args": { + "External id": 443950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761428.293, "dur": 1.222, + "args": { + "External id": 443951,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761431.243, "dur": 1.107, + "args": { + "External id": 443952,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761433.823, "dur": 1.442, + "args": { + "External id": 443953,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761436.804, "dur": 1.252, + "args": { + "External id": 443954,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761440.159, "dur": 0.876, + "args": { + "External id": 443955,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761442.661, "dur": 1.774, + "args": { + "External id": 443956,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761446.049, "dur": 1.049, + "args": { + "External id": 443957,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007761449.349, "dur": 1.068, + "args": { + "External id": 443958,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007761468.628, "dur": 7949.933, + "args": { + "External id": 443959,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007761484.500, "dur": 7927.537, + "args": { + "External id": 443960,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007761501.914, "dur": 13.892, + "args": { + "External id": 443961,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007761518.865, "dur": 7861.287, + "args": { + "External id": 443962,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007761521.449, "dur": 7858.265, + "args": { + "External id": 443963,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007761527.556, "dur": 7.125, + "args": { + "External id": 443964,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007761536.351, "dur": 7840.544, + "args": { + "External id": 443965,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007769610.722, "dur": 29.532, + "args": { + "External id": 443966,"Sequence number": 5285423, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6189 + } + }, + { + "ph": "s", "id": 177, "pid": 4183441, "tid": 4183441, "ts": 676007769610.722, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007769627.161, "dur": 8.278, + "args": { + "External id": 443967,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007769630.451, "dur": 4.728, + "args": { + "External id": 443968,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007769738.968, "dur": 90.951, + "args": { + "External id": 443969,"Record function id": 0, "Ev Idx": 6192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007769831.957, "dur": 1102.833, + "args": { + "External id": 443970,"Record function id": 0, "Ev Idx": 6193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007769875.996, "dur": 1044.323, + "args": { + "External id": 443971,"Sequence number": 5285424, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6194 + } + }, + { + "ph": "s", "id": 176, "pid": 4183441, "tid": 4183441, "ts": 676007769875.996, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007769947.605, "dur": 43.006, + "args": { + "External id": 443972,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770005.241, "dur": 109.469, + "args": { + "External id": 443973,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770127.735, "dur": 37.877, + "args": { + "External id": 443974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770174.161, "dur": 29.542, + "args": { + "External id": 443975,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007770230.043, "dur": 26.302, + "args": { + "External id": 443976,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007770273.996, "dur": 14.279, + "args": { + "External id": 443977,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007770306.416, "dur": 132.074, + "args": { + "External id": 443978,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007770357.430, "dur": 12.374, + "args": { + "External id": 443979,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007770362.816, "dur": 6.187, + "args": { + "External id": 443980,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007770372.714, "dur": 6.394, + "args": { + "External id": 443981,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007770380.851, "dur": 1.735, + "args": { + "External id": 443982,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007770384.699, "dur": 3.274, + "args": { + "External id": 443983,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770449.852, "dur": 43.801, + "args": { + "External id": 443984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007770525.168, "dur": 27.615, + "args": { + "External id": 443985,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770560.719, "dur": 37.572, + "args": { + "External id": 443986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770606.663, "dur": 31.485, + "args": { + "External id": 443987,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007770708.713, "dur": 32.081, + "args": { + "External id": 443988,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007770748.547, "dur": 55.789, + "args": { + "External id": 443989,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007770825.623, "dur": 18.656, + "args": { + "External id": 443990,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6213 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.17)", "pid": 4183441, "tid": 4183441, + "ts": 676007770999.605, "dur": 96.659, + "args": { + "External id": 443991,"Record function id": 0, "Ev Idx": 6214 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007771173.812, "dur": 48.076, + "args": { + "External id": 443992,"Record function id": 0, "Ev Idx": 6215 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.18)", "pid": 4183441, "tid": 4183441, + "ts": 676007771231.417, "dur": 9372.336, + "args": { + "External id": 443993,"Record function id": 0, "Ev Idx": 6216 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 4183441, "tid": 4183441, + "ts": 676007771239.839, "dur": 920.324, + "args": { + "External id": 443994,"Record function id": 0, "Ev Idx": 6217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007771328.227, "dur": 10.281, + "args": { + "External id": 443995,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007771352.050, "dur": 36.201, + "args": { + "External id": 443996,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771357.114, "dur": 2.391, + "args": { + "External id": 443997,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771364.115, "dur": 0.470, + "args": { + "External id": 443998,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771366.066, "dur": 0.770, + "args": { + "External id": 443999,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771368.095, "dur": 0.686, + "args": { + "External id": 444000,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771371.534, "dur": 0.772, + "args": { + "External id": 444001,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771373.893, "dur": 0.645, + "args": { + "External id": 444002,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771375.946, "dur": 2.587, + "args": { + "External id": 444003,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771379.899, "dur": 0.693, + "args": { + "External id": 444004,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771381.565, "dur": 0.632, + "args": { + "External id": 444005,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007771399.275, "dur": 42.737, + "args": { + "External id": 444006,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007771474.113, "dur": 111.703, + "args": { + "External id": 444007,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007771487.857, "dur": 5.577, + "args": { + "External id": 444008,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007771499.071, "dur": 10.276, + "args": { + "External id": 444009,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007771503.500, "dur": 5.445, + "args": { + "External id": 444010,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771507.114, "dur": 0.683, + "args": { + "External id": 444011,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007771516.017, "dur": 26.947, + "args": { + "External id": 444012,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771517.959, "dur": 0.405, + "args": { + "External id": 444013,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771519.817, "dur": 2.667, + "args": { + "External id": 444014,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771523.825, "dur": 0.639, + "args": { + "External id": 444015,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771525.453, "dur": 0.482, + "args": { + "External id": 444016,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771529.304, "dur": 0.508, + "args": { + "External id": 444017,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771530.783, "dur": 0.594, + "args": { + "External id": 444018,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771532.644, "dur": 0.389, + "args": { + "External id": 444019,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771536.200, "dur": 0.434, + "args": { + "External id": 444020,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007771538.357, "dur": 0.416, + "args": { + "External id": 444021,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007771554.891, "dur": 22.910, + "args": { + "External id": 444022,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007771636.779, "dur": 410.637, + "args": { + "External id": 444023,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007771702.322, "dur": 339.622, + "args": { + "External id": 444024,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6247, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007771714.588, "dur": 321.916, + "args": { + "External id": 444025,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007772068.397, "dur": 2.131, + "args": { + "External id": 444026,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6249, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 4183441, "tid": 4183441, + "ts": 676007772182.544, "dur": 8208.176, + "args": { + "External id": 444027,"Record function id": 0, "Ev Idx": 6250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772286.212, "dur": 6.363, + "args": { + "External id": 444028,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772295.983, "dur": 1.146, + "args": { + "External id": 444029,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772298.686, "dur": 1.473, + "args": { + "External id": 444030,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772301.688, "dur": 0.911, + "args": { + "External id": 444031,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772304.490, "dur": 1.262, + "args": { + "External id": 444032,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772307.355, "dur": 1.000, + "args": { + "External id": 444033,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772310.302, "dur": 0.989, + "args": { + "External id": 444034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772313.436, "dur": 2.459, + "args": { + "External id": 444035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772317.738, "dur": 1.088, + "args": { + "External id": 444036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007772320.619, "dur": 0.972, + "args": { + "External id": 444037,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007772340.092, "dur": 8012.796, + "args": { + "External id": 444038,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007772355.101, "dur": 7991.143, + "args": { + "External id": 444039,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007772371.997, "dur": 13.951, + "args": { + "External id": 444040,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007772388.779, "dur": 7925.240, + "args": { + "External id": 444041,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007772391.168, "dur": 7922.369, + "args": { + "External id": 444042,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007772397.680, "dur": 5.690, + "args": { + "External id": 444043,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007772405.394, "dur": 7905.050, + "args": { + "External id": 444044,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007780539.318, "dur": 35.822, + "args": { + "External id": 444045,"Sequence number": 5285425, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6268 + } + }, + { + "ph": "s", "id": 175, "pid": 4183441, "tid": 4183441, "ts": 676007780539.318, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007780561.847, "dur": 8.095, + "args": { + "External id": 444046,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007780565.105, "dur": 4.584, + "args": { + "External id": 444047,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007780643.620, "dur": 120.374, + "args": { + "External id": 444048,"Record function id": 0, "Ev Idx": 6271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007780767.740, "dur": 1103.570, + "args": { + "External id": 444049,"Record function id": 0, "Ev Idx": 6272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007780811.064, "dur": 1045.961, + "args": { + "External id": 444050,"Sequence number": 5285426, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6273 + } + }, + { + "ph": "s", "id": 174, "pid": 4183441, "tid": 4183441, "ts": 676007780811.064, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007780885.663, "dur": 44.800, + "args": { + "External id": 444051,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007780946.063, "dur": 96.292, + "args": { + "External id": 444052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781050.837, "dur": 51.449, + "args": { + "External id": 444053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781111.931, "dur": 33.669, + "args": { + "External id": 444054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007781173.357, "dur": 27.799, + "args": { + "External id": 444055,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007781217.374, "dur": 17.664, + "args": { + "External id": 444056,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007781252.318, "dur": 130.968, + "args": { + "External id": 444057,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007781303.833, "dur": 12.001, + "args": { + "External id": 444058,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007781308.943, "dur": 6.088, + "args": { + "External id": 444059,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007781318.598, "dur": 4.553, + "args": { + "External id": 444060,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007781324.421, "dur": 3.880, + "args": { + "External id": 444061,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007781330.859, "dur": 3.093, + "args": { + "External id": 444062,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781393.731, "dur": 49.972, + "args": { + "External id": 444063,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007781475.230, "dur": 29.621, + "args": { + "External id": 444064,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781513.128, "dur": 37.421, + "args": { + "External id": 444065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781557.447, "dur": 31.287, + "args": { + "External id": 444066,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007781612.617, "dur": 26.469, + "args": { + "External id": 444067,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007781645.156, "dur": 96.005, + "args": { + "External id": 444068,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007781765.389, "dur": 21.041, + "args": { + "External id": 444069,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6292 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.18)", "pid": 4183441, "tid": 4183441, + "ts": 676007781935.432, "dur": 80.268, + "args": { + "External id": 444070,"Record function id": 0, "Ev Idx": 6293 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 4183441, "tid": 4183441, + "ts": 676007782107.590, "dur": 49.418, + "args": { + "External id": 444071,"Record function id": 0, "Ev Idx": 6294 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.19)", "pid": 4183441, "tid": 4183441, + "ts": 676007782166.094, "dur": 9370.687, + "args": { + "External id": 444072,"Record function id": 0, "Ev Idx": 6295 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 4183441, "tid": 4183441, + "ts": 676007782174.430, "dur": 927.059, + "args": { + "External id": 444073,"Record function id": 0, "Ev Idx": 6296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007782261.295, "dur": 9.844, + "args": { + "External id": 444074,"Record function id": 0, "Concrete Inputs": ["[1605888]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007782285.053, "dur": 36.479, + "args": { + "External id": 444075,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782290.829, "dur": 2.444, + "args": { + "External id": 444076,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782297.943, "dur": 0.584, + "args": { + "External id": 444077,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "128"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782299.783, "dur": 0.820, + "args": { + "External id": 444078,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "131200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782302.396, "dur": 0.753, + "args": { + "External id": 444079,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "262272"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782306.028, "dur": 0.784, + "args": { + "External id": 444080,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "393344"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782307.858, "dur": 0.590, + "args": { + "External id": 444081,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "524416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782309.360, "dur": 2.311, + "args": { + "External id": 444082,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782312.851, "dur": 0.564, + "args": { + "External id": 444083,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "884992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782314.436, "dur": 0.594, + "args": { + "External id": 444084,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "1245440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007782334.163, "dur": 42.124, + "args": { + "External id": 444085,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 4183441, "tid": 4183441, + "ts": 676007782408.575, "dur": 114.441, + "args": { + "External id": 444086,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1605888", "8", "5", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [], [], [], [], [], []], "Ev Idx": 6309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007782418.605, "dur": 4.808, + "args": { + "External id": 444087,"Record function id": 0, "Concrete Inputs": ["[12847104]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 4183441, "tid": 4183441, + "ts": 676007782428.827, "dur": 10.515, + "args": { + "External id": 444088,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "1605888"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007782433.422, "dur": 5.537, + "args": { + "External id": 444089,"Record function id": 0, "Concrete Inputs": ["", "0", "8029440", "9635328", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[12847104], [], [], [], []], "Ev Idx": 6312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782437.024, "dur": 0.704, + "args": { + "External id": 444090,"Record function id": 0, "Concrete Inputs": ["", "[1605888]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[12847104], [], [], []], "Ev Idx": 6313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 4183441, "tid": 4183441, + "ts": 676007782445.703, "dur": 32.296, + "args": { + "External id": 444091,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1605888], [], []], "Ev Idx": 6314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782447.456, "dur": 2.796, + "args": { + "External id": 444092,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8029440"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782451.715, "dur": 0.924, + "args": { + "External id": 444093,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8029568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782453.800, "dur": 0.897, + "args": { + "External id": 444094,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8160640"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782458.375, "dur": 0.689, + "args": { + "External id": 444095,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8291712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782460.151, "dur": 0.731, + "args": { + "External id": 444096,"Record function id": 0, "Concrete Inputs": ["", "[131072]", "[1]", "8422784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782462.208, "dur": 0.651, + "args": { + "External id": 444097,"Record function id": 0, "Concrete Inputs": ["", "[128]", "[1]", "8553856"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782465.826, "dur": 0.952, + "args": { + "External id": 444098,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8553984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782467.941, "dur": 0.591, + "args": { + "External id": 444099,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "8914432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007782469.909, "dur": 2.716, + "args": { + "External id": 444100,"Record function id": 0, "Concrete Inputs": ["", "[360448]", "[1]", "9274880"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[1605888], [], [], []], "Ev Idx": 6323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007782491.623, "dur": 23.443, + "args": { + "External id": 444101,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], [[128], [131072], [131072], [131072], [131072], [128], [360448], [360448], [360448]], []], "Ev Idx": 6324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 4183441, "tid": 4183441, + "ts": 676007782575.746, "dur": 412.866, + "args": { + "External id": 444102,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[12847104], [1605888], [], [], []], "Ev Idx": 6325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007782601.637, "dur": 381.348, + "args": { + "External id": 444103,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 5, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 12847104, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[1605888], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6326, "In msg nelems": 1605888 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 4183441, "tid": 4183441, + "ts": 676007782611.717, "dur": 365.306, + "args": { + "External id": 444104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[1605888]], "Ev Idx": 6327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676007783011.402, "dur": 2.393, + "args": { + "External id": 444105,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6328, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 4183441, "tid": 4183441, + "ts": 676007783126.151, "dur": 8205.401, + "args": { + "External id": 444106,"Record function id": 0, "Ev Idx": 6329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783231.756, "dur": 6.812, + "args": { + "External id": 444107,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[12847104], []], "Ev Idx": 6330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783251.452, "dur": 1.818, + "args": { + "External id": 444108,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783255.064, "dur": 1.415, + "args": { + "External id": 444109,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783258.039, "dur": 0.937, + "args": { + "External id": 444110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783260.420, "dur": 1.210, + "args": { + "External id": 444111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783263.246, "dur": 1.484, + "args": { + "External id": 444112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1048576], []], "Ev Idx": 6335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783266.763, "dur": 0.928, + "args": { + "External id": 444113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[1024], []], "Ev Idx": 6336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783269.292, "dur": 2.865, + "args": { + "External id": 444114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783273.843, "dur": 1.053, + "args": { + "External id": 444115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007783276.793, "dur": 0.858, + "args": { + "External id": 444116,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2883584], []], "Ev Idx": 6339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007783297.335, "dur": 7997.247, + "args": { + "External id": 444117,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007783312.866, "dur": 7975.246, + "args": { + "External id": 444118,"Record function id": 0, "Concrete Inputs": ["", "[128, 131072, 131072, 131072, 131072, 128, 360448, 360448, 360448]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[1605888, 1], [], [], [[128, 1], [131072, 1], [131072, 1], [131072, 1], [131072, 1], [128, 1], [360448, 1], [360448, 1], [360448, 1]]], "Input Dims": [[8, 1605888], [], [], [[8, 128], [8, 131072], [8, 131072], [8, 131072], [8, 131072], [8, 128], [8, 360448], [8, 360448], [8, 360448]]], "Ev Idx": 6341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007783327.501, "dur": 14.831, + "args": { + "External id": 444119,"Record function id": 0, "Concrete Inputs": ["[823]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007783344.872, "dur": 7912.156, + "args": { + "External id": 444120,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], [], []], "Ev Idx": 6343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007783347.662, "dur": 7908.667, + "args": { + "External id": 444121,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[823], [], [], [], [], [], []], "Ev Idx": 6344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007783353.430, "dur": 5.705, + "args": { + "External id": 444122,"Record function id": 0, "Concrete Inputs": ["[823]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007783360.984, "dur": 7892.841, + "args": { + "External id": 444123,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[823], [823], []], "Ev Idx": 6346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007791481.300, "dur": 30.448, + "args": { + "External id": 444124,"Sequence number": 5285427, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024]], "Ev Idx": 6347 + } + }, + { + "ph": "s", "id": 173, "pid": 4183441, "tid": 4183441, "ts": 676007791481.300, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676007791498.899, "dur": 8.119, + "args": { + "External id": 444125,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1]], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024]], "Ev Idx": 6348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007791502.131, "dur": 4.662, + "args": { + "External id": 444126,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007791574.367, "dur": 119.981, + "args": { + "External id": 444127,"Record function id": 0, "Ev Idx": 6350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 4183441, "tid": 4183441, + "ts": 676007791697.461, "dur": 1062.332, + "args": { + "External id": 444128,"Record function id": 0, "Ev Idx": 6351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007791739.653, "dur": 1005.081, + "args": { + "External id": 444129,"Sequence number": 5285428, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1], [1024, 1], [1024, 1], [1024, 1], [32, 1], [32, 1], [1024, 1], [1], [1024, 1], [1024, 1], [2816, 1]], "Input Dims": [[16, 4096, 1024], [1024], [1024, 1024], [1024, 1024], [1024, 1024], [8192, 32], [8192, 32], [1024, 1024], [1024], [2816, 1024], [2816, 1024], [1024, 2816]], "Ev Idx": 6352 + } + }, + { + "ph": "s", "id": 172, "pid": 4183441, "tid": 4183441, "ts": 676007791739.653, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007791808.769, "dur": 43.714, + "args": { + "External id": 444130,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007791867.618, "dur": 93.757, + "args": { + "External id": 444131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007791970.502, "dur": 33.557, + "args": { + "External id": 444132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007792012.854, "dur": 28.440, + "args": { + "External id": 444133,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007792064.188, "dur": 41.361, + "args": { + "External id": 444134,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 4183441, "tid": 4183441, + "ts": 676007792126.228, "dur": 15.305, + "args": { + "External id": 444135,"kernel_hash": "cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "16", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/fg/cfgbunk6pj5cbcf26yzakiert2ar3scfxn73vpkwgmaeb47aofuy.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007792160.065, "dur": 130.181, + "args": { + "External id": 444136,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007792211.956, "dur": 13.146, + "args": { + "External id": 444137,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007792217.600, "dur": 6.653, + "args": { + "External id": 444138,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007792228.175, "dur": 4.309, + "args": { + "External id": 444139,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007792233.835, "dur": 1.673, + "args": { + "External id": 444140,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007792237.851, "dur": 2.645, + "args": { + "External id": 444141,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007792300.964, "dur": 48.865, + "args": { + "External id": 444142,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [1024, 1]], "Input Dims": [[65536, 1024], [1024, 1024], [65536, 1024]], "Ev Idx": 6365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 4183441, "tid": 4183441, + "ts": 676007792381.438, "dur": 30.975, + "args": { + "External id": 444143,"kernel_hash": "clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/lc/clcngfbq5gg5fhozf3aqmypm7kzb5btr6pwzqk75thmiisp56t2a.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1024, 1], [1024, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536, 1024], [1024], [65536, 1024], [65536, 1024], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007792420.037, "dur": 37.934, + "args": { + "External id": 444144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007792466.834, "dur": 31.277, + "args": { + "External id": 444145,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024], [2816, 1]], "Input Dims": [[65536, 1024], [1024, 2816], [65536, 2816]], "Ev Idx": 6368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 4183441, "tid": 4183441, + "ts": 676007792519.460, "dur": 24.584, + "args": { + "External id": 444146,"kernel_hash": "c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab", "grid": "grid(184549376,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "184549376"], "kernel_file": "/tmp/torchinductor_cvm/7l/c7lfzweae4ij4e73sdwkv3irxt4dpgqoiir4uwsg5ntelgfnjmab.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2816, 1], [2816, 1], [11534336, 2816, 1], []], "Input Dims": [[65536, 2816], [65536, 2816], [16, 4096, 2816], []], "Ev Idx": 6369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007792549.810, "dur": 47.268, + "args": { + "External id": 444147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816], [1024, 1]], "Input Dims": [[65536, 2816], [2816, 1024], [65536, 1024]], "Ev Idx": 6370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 4183441, "tid": 4183441, + "ts": 676007792616.744, "dur": 17.353, + "args": { + "External id": 444148,"kernel_hash": "c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu", "grid": "grid(67108864,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "67108864"], "kernel_file": "/tmp/torchinductor_cvm/7i/c7ixwyptf6e33ugfafyyobufdrjo6jntcezqykswcamcywku44gu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [65536, 1024], []], "Ev Idx": 6371 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.19)", "pid": 4183441, "tid": 4183441, + "ts": 676007792825.754, "dur": 33.840, + "args": { + "External id": 444149,"Record function id": 0, "Ev Idx": 6372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007792942.596, "dur": 294.664, + "args": { + "External id": 444150,"Sequence number": 5285429, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6373 + } + }, + { + "ph": "s", "id": 171, "pid": 4183441, "tid": 4183441, "ts": 676007792942.596, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007792973.126, "dur": 7.921, + "args": { + "External id": 444151,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007792975.105, "dur": 5.714, + "args": { + "External id": 444152,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007792990.944, "dur": 12.539, + "args": { + "External id": 444153,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007792994.544, "dur": 8.297, + "args": { + "External id": 444154,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007793011.257, "dur": 4.555, + "args": { + "External id": 444155,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793214.632, "dur": 7.833, + "args": { + "External id": 444156,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793218.269, "dur": 3.785, + "args": { + "External id": 444157,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007793267.334, "dur": 133.263, + "args": { + "External id": 444158,"Sequence number": 5285430, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007793270.387, "dur": 16.198, + "args": { + "External id": 444159,"Sequence number": 5285430, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6382 + } + }, + { + "ph": "s", "id": 170, "pid": 4183441, "tid": 4183441, "ts": 676007793270.387, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007793277.588, "dur": 7.099, + "args": { + "External id": 444160,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007793281.834, "dur": 2.490, + "args": { + "External id": 444161,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007793289.741, "dur": 110.427, + "args": { + "External id": 444162,"Sequence number": 5285431, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793292.998, "dur": 5.800, + "args": { + "External id": 444163,"Sequence number": 5285431, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793294.609, "dur": 4.051, + "args": { + "External id": 444164,"Sequence number": 5285431, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6387 + } + }, + { + "ph": "s", "id": 169, "pid": 4183441, "tid": 4183441, "ts": 676007793294.609, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007793301.337, "dur": 87.751, + "args": { + "External id": 444165,"Sequence number": 5285432, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6388 + } + }, + { + "ph": "s", "id": 168, "pid": 4183441, "tid": 4183441, "ts": 676007793301.337, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007793392.050, "dur": 6.585, + "args": { + "External id": 444166,"Sequence number": 5285433, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6389 + } + }, + { + "ph": "s", "id": 167, "pid": 4183441, "tid": 4183441, "ts": 676007793392.050, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007793411.082, "dur": 64.123, + "args": { + "External id": 444167,"Sequence number": 5285434, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007793412.184, "dur": 7.116, + "args": { + "External id": 444168,"Sequence number": 5285434, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6391 + } + }, + { + "ph": "s", "id": 166, "pid": 4183441, "tid": 4183441, "ts": 676007793412.184, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007793414.569, "dur": 3.319, + "args": { + "External id": 444169,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007793416.640, "dur": 1.100, + "args": { + "External id": 444170,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007793420.379, "dur": 54.574, + "args": { + "External id": 444171,"Sequence number": 5285435, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793421.706, "dur": 6.016, + "args": { + "External id": 444172,"Sequence number": 5285435, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793423.119, "dur": 4.428, + "args": { + "External id": 444173,"Sequence number": 5285435, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6396 + } + }, + { + "ph": "s", "id": 165, "pid": 4183441, "tid": 4183441, "ts": 676007793423.119, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007793429.106, "dur": 39.137, + "args": { + "External id": 444174,"Sequence number": 5285436, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6397 + } + }, + { + "ph": "s", "id": 164, "pid": 4183441, "tid": 4183441, "ts": 676007793429.106, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007793469.670, "dur": 4.843, + "args": { + "External id": 444175,"Sequence number": 5285437, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6398 + } + }, + { + "ph": "s", "id": 163, "pid": 4183441, "tid": 4183441, "ts": 676007793469.670, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007793482.334, "dur": 60.718, + "args": { + "External id": 444176,"Sequence number": 5285438, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007793483.241, "dur": 6.782, + "args": { + "External id": 444177,"Sequence number": 5285438, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6400 + } + }, + { + "ph": "s", "id": 162, "pid": 4183441, "tid": 4183441, "ts": 676007793483.241, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007793485.780, "dur": 2.581, + "args": { + "External id": 444178,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007793487.545, "dur": 0.702, + "args": { + "External id": 444179,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007793490.821, "dur": 51.996, + "args": { + "External id": 444180,"Sequence number": 5285439, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793491.928, "dur": 5.355, + "args": { + "External id": 444181,"Sequence number": 5285439, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793493.350, "dur": 3.766, + "args": { + "External id": 444182,"Sequence number": 5285439, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6405 + } + }, + { + "ph": "s", "id": 161, "pid": 4183441, "tid": 4183441, "ts": 676007793493.350, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007793498.232, "dur": 38.469, + "args": { + "External id": 444183,"Sequence number": 5285440, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6406 + } + }, + { + "ph": "s", "id": 160, "pid": 4183441, "tid": 4183441, "ts": 676007793498.232, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007793538.392, "dur": 4.041, + "args": { + "External id": 444184,"Sequence number": 5285441, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6407 + } + }, + { + "ph": "s", "id": 159, "pid": 4183441, "tid": 4183441, "ts": 676007793538.392, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793562.232, "dur": 4.828, + "args": { + "External id": 444185,"Sequence number": 5285442, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793563.366, "dur": 3.563, + "args": { + "External id": 444186,"Sequence number": 5285442, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6409 + } + }, + { + "ph": "s", "id": 158, "pid": 4183441, "tid": 4183441, "ts": 676007793563.366, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793576.129, "dur": 5.456, + "args": { + "External id": 444187,"Sequence number": 5285443, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793577.281, "dur": 4.164, + "args": { + "External id": 444188,"Sequence number": 5285443, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6411 + } + }, + { + "ph": "s", "id": 157, "pid": 4183441, "tid": 4183441, "ts": 676007793577.281, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007793585.746, "dur": 3.438, + "args": { + "External id": 444189,"Sequence number": 5285444, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007793586.945, "dur": 1.883, + "args": { + "External id": 444190,"Sequence number": 5285444, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6413 + } + }, + { + "ph": "s", "id": 156, "pid": 4183441, "tid": 4183441, "ts": 676007793586.945, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007793623.792, "dur": 217.327, + "args": { + "External id": 444191,"Sequence number": 5285445, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6414 + } + }, + { + "ph": "s", "id": 155, "pid": 4183441, "tid": 4183441, "ts": 676007793623.792, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007793644.728, "dur": 44.631, + "args": { + "External id": 444192,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007793647.405, "dur": 40.962, + "args": { + "External id": 444193,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007793860.197, "dur": 113.595, + "args": { + "External id": 444194,"Sequence number": 5285446, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6417 + } + }, + { + "ph": "s", "id": 154, "pid": 4183441, "tid": 4183441, "ts": 676007793860.197, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007793874.910, "dur": 9.503, + "args": { + "External id": 444195,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007793877.420, "dur": 6.612, + "args": { + "External id": 444196,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183441, "tid": 4183441, + "ts": 676007794005.573, "dur": 205.630, + "args": { + "External id": 444197,"Sequence number": 5285447, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6420 + } + }, + { + "ph": "s", "id": 153, "pid": 4183441, "tid": 4183441, "ts": 676007794005.573, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007794034.582, "dur": 145.668, + "args": { + "External id": 444198,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007794080.575, "dur": 25.716, + "args": { + "External id": 444199,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007794099.621, "dur": 5.934, + "args": { + "External id": 444200,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794109.045, "dur": 4.424, + "args": { + "External id": 444201,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794114.840, "dur": 1.600, + "args": { + "External id": 444202,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794119.099, "dur": 5.911, + "args": { + "External id": 444203,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 4183441, + "ts": 676007794194.309, "dur": 6.135, + "args": { + "External id": 444204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794217.010, "dur": 6.532, + "args": { + "External id": 444205,"Sequence number": 5285448, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794218.433, "dur": 4.947, + "args": { + "External id": 444206,"Sequence number": 5285448, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6429 + } + }, + { + "ph": "s", "id": 152, "pid": 4183441, "tid": 4183441, "ts": 676007794218.433, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007794238.193, "dur": 116.529, + "args": { + "External id": 444207,"Sequence number": 5285449, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007794240.000, "dur": 9.676, + "args": { + "External id": 444208,"Sequence number": 5285449, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6431 + } + }, + { + "ph": "s", "id": 151, "pid": 4183441, "tid": 4183441, "ts": 676007794240.000, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007794243.273, "dur": 5.067, + "args": { + "External id": 444209,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007794246.371, "dur": 1.667, + "args": { + "External id": 444210,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007794251.022, "dur": 103.383, + "args": { + "External id": 444211,"Sequence number": 5285450, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794253.318, "dur": 5.902, + "args": { + "External id": 444212,"Sequence number": 5285450, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794254.425, "dur": 4.650, + "args": { + "External id": 444213,"Sequence number": 5285450, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6436 + } + }, + { + "ph": "s", "id": 150, "pid": 4183441, "tid": 4183441, "ts": 676007794254.425, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007794260.633, "dur": 85.944, + "args": { + "External id": 444214,"Sequence number": 5285451, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6437 + } + }, + { + "ph": "s", "id": 149, "pid": 4183441, "tid": 4183441, "ts": 676007794260.633, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007794349.474, "dur": 4.240, + "args": { + "External id": 444215,"Sequence number": 5285452, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6438 + } + }, + { + "ph": "s", "id": 148, "pid": 4183441, "tid": 4183441, "ts": 676007794349.474, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007794393.486, "dur": 232.869, + "args": { + "External id": 444216,"Sequence number": 5285453, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6439 + } + }, + { + "ph": "s", "id": 147, "pid": 4183441, "tid": 4183441, "ts": 676007794393.486, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794413.445, "dur": 2.839, + "args": { + "External id": 444217,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794414.844, "dur": 1.308, + "args": { + "External id": 444218,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183441, "tid": 4183441, + "ts": 676007794422.865, "dur": 3.920, + "args": { + "External id": 444219,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794424.519, "dur": 2.163, + "args": { + "External id": 444220,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794425.540, "dur": 1.042, + "args": { + "External id": 444221,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007794435.195, "dur": 7.398, + "args": { + "External id": 444222,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007794437.494, "dur": 4.764, + "args": { + "External id": 444223,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794449.569, "dur": 3.260, + "args": { + "External id": 444224,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794456.734, "dur": 4.774, + "args": { + "External id": 444225,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794602.967, "dur": 5.736, + "args": { + "External id": 444226,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794604.277, "dur": 4.188, + "args": { + "External id": 444227,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794611.672, "dur": 3.152, + "args": { + "External id": 444228,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794613.176, "dur": 1.297, + "args": { + "External id": 444229,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007794648.351, "dur": 175.268, + "args": { + "External id": 444230,"Sequence number": 5285454, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007794649.475, "dur": 62.652, + "args": { + "External id": 444231,"Sequence number": 5285454, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6454 + } + }, + { + "ph": "s", "id": 146, "pid": 4183441, "tid": 4183441, "ts": 676007794649.475, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007794704.426, "dur": 5.640, + "args": { + "External id": 444232,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007794707.777, "dur": 1.754, + "args": { + "External id": 444233,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007794713.732, "dur": 109.531, + "args": { + "External id": 444234,"Sequence number": 5285455, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794715.772, "dur": 6.673, + "args": { + "External id": 444235,"Sequence number": 5285455, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794716.601, "dur": 5.693, + "args": { + "External id": 444236,"Sequence number": 5285455, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6459 + } + }, + { + "ph": "s", "id": 145, "pid": 4183441, "tid": 4183441, "ts": 676007794716.601, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007794723.410, "dur": 93.824, + "args": { + "External id": 444237,"Sequence number": 5285456, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6460 + } + }, + { + "ph": "s", "id": 144, "pid": 4183441, "tid": 4183441, "ts": 676007794723.410, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007794819.524, "dur": 2.960, + "args": { + "External id": 444238,"Sequence number": 5285457, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6461 + } + }, + { + "ph": "s", "id": 143, "pid": 4183441, "tid": 4183441, "ts": 676007794819.524, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007794836.973, "dur": 69.951, + "args": { + "External id": 444239,"Sequence number": 5285458, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007794837.899, "dur": 9.826, + "args": { + "External id": 444240,"Sequence number": 5285458, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6463 + } + }, + { + "ph": "s", "id": 142, "pid": 4183441, "tid": 4183441, "ts": 676007794837.899, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007794840.435, "dur": 5.998, + "args": { + "External id": 444241,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007794845.015, "dur": 1.179, + "args": { + "External id": 444242,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007794848.403, "dur": 58.285, + "args": { + "External id": 444243,"Sequence number": 5285459, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007794849.693, "dur": 5.193, + "args": { + "External id": 444244,"Sequence number": 5285459, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007794851.066, "dur": 3.693, + "args": { + "External id": 444245,"Sequence number": 5285459, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6468 + } + }, + { + "ph": "s", "id": 141, "pid": 4183441, "tid": 4183441, "ts": 676007794851.066, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007794855.559, "dur": 44.869, + "args": { + "External id": 444246,"Sequence number": 5285460, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6469 + } + }, + { + "ph": "s", "id": 140, "pid": 4183441, "tid": 4183441, "ts": 676007794855.559, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007794902.164, "dur": 4.191, + "args": { + "External id": 444247,"Sequence number": 5285461, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6470 + } + }, + { + "ph": "s", "id": 139, "pid": 4183441, "tid": 4183441, "ts": 676007794902.164, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007794932.115, "dur": 176.488, + "args": { + "External id": 444248,"Sequence number": 5285462, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6471 + } + }, + { + "ph": "s", "id": 138, "pid": 4183441, "tid": 4183441, "ts": 676007794932.115, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007794978.685, "dur": 4.592, + "args": { + "External id": 444249,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007795018.589, "dur": 57.675, + "args": { + "External id": 444250,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007795019.667, "dur": 4.976, + "args": { + "External id": 444251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007795020.892, "dur": 2.820, + "args": { + "External id": 444252,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795022.601, "dur": 0.960, + "args": { + "External id": 444253,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007795025.734, "dur": 50.220, + "args": { + "External id": 444254,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795027.415, "dur": 3.099, + "args": { + "External id": 444255,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795028.668, "dur": 1.735, + "args": { + "External id": 444256,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007795031.481, "dur": 40.665, + "args": { + "External id": 444257,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007795073.872, "dur": 1.444, + "args": { + "External id": 444258,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676007795120.362, "dur": 32.383, + "args": { + "External id": 444259,"Sequence number": 5285463, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6482 + } + }, + { + "ph": "s", "id": 137, "pid": 4183441, "tid": 4183441, "ts": 676007795120.362, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007795192.227, "dur": 198.105, + "args": { + "External id": 444260,"Sequence number": 5285464, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6483 + } + }, + { + "ph": "s", "id": 136, "pid": 4183441, "tid": 4183441, "ts": 676007795192.227, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795215.619, "dur": 3.780, + "args": { + "External id": 444261,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795216.955, "dur": 2.286, + "args": { + "External id": 444262,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007795227.635, "dur": 7.284, + "args": { + "External id": 444263,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795230.477, "dur": 4.062, + "args": { + "External id": 444264,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007795240.952, "dur": 3.711, + "args": { + "External id": 444265,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795375.254, "dur": 4.824, + "args": { + "External id": 444266,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795378.457, "dur": 1.350, + "args": { + "External id": 444267,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007795408.945, "dur": 82.247, + "args": { + "External id": 444268,"Sequence number": 5285465, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007795410.019, "dur": 7.631, + "args": { + "External id": 444269,"Sequence number": 5285465, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6492 + } + }, + { + "ph": "s", "id": 135, "pid": 4183441, "tid": 4183441, "ts": 676007795410.019, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007795412.729, "dur": 3.736, + "args": { + "External id": 444270,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795414.634, "dur": 1.632, + "args": { + "External id": 444271,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007795418.855, "dur": 72.118, + "args": { + "External id": 444272,"Sequence number": 5285466, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795421.038, "dur": 3.464, + "args": { + "External id": 444273,"Sequence number": 5285466, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795421.859, "dur": 2.492, + "args": { + "External id": 444274,"Sequence number": 5285466, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6497 + } + }, + { + "ph": "s", "id": 134, "pid": 4183441, "tid": 4183441, "ts": 676007795421.859, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007795425.380, "dur": 59.708, + "args": { + "External id": 444275,"Sequence number": 5285467, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6498 + } + }, + { + "ph": "s", "id": 133, "pid": 4183441, "tid": 4183441, "ts": 676007795425.380, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007795487.196, "dur": 3.084, + "args": { + "External id": 444276,"Sequence number": 5285468, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6499 + } + }, + { + "ph": "s", "id": 132, "pid": 4183441, "tid": 4183441, "ts": 676007795487.196, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007795499.500, "dur": 64.665, + "args": { + "External id": 444277,"Sequence number": 5285469, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007795500.144, "dur": 9.469, + "args": { + "External id": 444278,"Sequence number": 5285469, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6501 + } + }, + { + "ph": "s", "id": 131, "pid": 4183441, "tid": 4183441, "ts": 676007795500.144, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007795504.643, "dur": 3.661, + "args": { + "External id": 444279,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795506.763, "dur": 1.412, + "args": { + "External id": 444280,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007795510.328, "dur": 53.577, + "args": { + "External id": 444281,"Sequence number": 5285470, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795511.390, "dur": 6.343, + "args": { + "External id": 444282,"Sequence number": 5285470, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795512.600, "dur": 4.982, + "args": { + "External id": 444283,"Sequence number": 5285470, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6506 + } + }, + { + "ph": "s", "id": 130, "pid": 4183441, "tid": 4183441, "ts": 676007795512.600, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007795518.621, "dur": 38.651, + "args": { + "External id": 444284,"Sequence number": 5285471, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6507 + } + }, + { + "ph": "s", "id": 129, "pid": 4183441, "tid": 4183441, "ts": 676007795518.621, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007795558.899, "dur": 4.566, + "args": { + "External id": 444285,"Sequence number": 5285472, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6508 + } + }, + { + "ph": "s", "id": 128, "pid": 4183441, "tid": 4183441, "ts": 676007795558.899, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007795570.723, "dur": 57.508, + "args": { + "External id": 444286,"Sequence number": 5285473, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007795571.454, "dur": 5.556, + "args": { + "External id": 444287,"Sequence number": 5285473, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6510 + } + }, + { + "ph": "s", "id": 127, "pid": 4183441, "tid": 4183441, "ts": 676007795571.454, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007795573.570, "dur": 2.351, + "args": { + "External id": 444288,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795575.142, "dur": 0.634, + "args": { + "External id": 444289,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007795577.872, "dur": 50.167, + "args": { + "External id": 444290,"Sequence number": 5285474, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795579.246, "dur": 5.573, + "args": { + "External id": 444291,"Sequence number": 5285474, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795580.629, "dur": 4.039, + "args": { + "External id": 444292,"Sequence number": 5285474, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6515 + } + }, + { + "ph": "s", "id": 126, "pid": 4183441, "tid": 4183441, "ts": 676007795580.629, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007795585.439, "dur": 37.360, + "args": { + "External id": 444293,"Sequence number": 5285475, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6516 + } + }, + { + "ph": "s", "id": 125, "pid": 4183441, "tid": 4183441, "ts": 676007795585.439, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007795624.336, "dur": 3.266, + "args": { + "External id": 444294,"Sequence number": 5285476, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6517 + } + }, + { + "ph": "s", "id": 124, "pid": 4183441, "tid": 4183441, "ts": 676007795624.336, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795643.400, "dur": 4.033, + "args": { + "External id": 444295,"Sequence number": 5285477, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795644.589, "dur": 2.698, + "args": { + "External id": 444296,"Sequence number": 5285477, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6519 + } + }, + { + "ph": "s", "id": 123, "pid": 4183441, "tid": 4183441, "ts": 676007795644.589, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795705.453, "dur": 6.569, + "args": { + "External id": 444297,"Sequence number": 5285478, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795706.500, "dur": 5.286, + "args": { + "External id": 444298,"Sequence number": 5285478, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6521 + } + }, + { + "ph": "s", "id": 122, "pid": 4183441, "tid": 4183441, "ts": 676007795706.500, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007795717.393, "dur": 5.059, + "args": { + "External id": 444299,"Sequence number": 5285479, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007795718.580, "dur": 3.715, + "args": { + "External id": 444300,"Sequence number": 5285479, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6523 + } + }, + { + "ph": "s", "id": 121, "pid": 4183441, "tid": 4183441, "ts": 676007795718.580, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007795754.136, "dur": 165.595, + "args": { + "External id": 444301,"Sequence number": 5285480, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6524 + } + }, + { + "ph": "s", "id": 120, "pid": 4183441, "tid": 4183441, "ts": 676007795754.136, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007795775.057, "dur": 9.233, + "args": { + "External id": 444302,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795777.777, "dur": 6.116, + "args": { + "External id": 444303,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007795933.154, "dur": 105.086, + "args": { + "External id": 444304,"Sequence number": 5285481, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6527 + } + }, + { + "ph": "s", "id": 119, "pid": 4183441, "tid": 4183441, "ts": 676007795933.154, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007795946.926, "dur": 7.488, + "args": { + "External id": 444305,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007795949.767, "dur": 4.327, + "args": { + "External id": 444306,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183441, "tid": 4183441, + "ts": 676007796067.004, "dur": 198.394, + "args": { + "External id": 444307,"Sequence number": 5285482, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6530 + } + }, + { + "ph": "s", "id": 118, "pid": 4183441, "tid": 4183441, "ts": 676007796067.004, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007796110.115, "dur": 128.323, + "args": { + "External id": 444308,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007796157.538, "dur": 8.699, + "args": { + "External id": 444309,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007796160.389, "dur": 5.077, + "args": { + "External id": 444310,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796168.755, "dur": 4.207, + "args": { + "External id": 444311,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796174.442, "dur": 1.579, + "args": { + "External id": 444312,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796180.524, "dur": 3.258, + "args": { + "External id": 444313,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 4183441, + "ts": 676007796250.343, "dur": 4.916, + "args": { + "External id": 444314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796270.539, "dur": 6.117, + "args": { + "External id": 444315,"Sequence number": 5285483, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796271.800, "dur": 4.722, + "args": { + "External id": 444316,"Sequence number": 5285483, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6539 + } + }, + { + "ph": "s", "id": 117, "pid": 4183441, "tid": 4183441, "ts": 676007796271.800, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007796288.162, "dur": 104.923, + "args": { + "External id": 444317,"Sequence number": 5285484, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007796289.669, "dur": 8.712, + "args": { + "External id": 444318,"Sequence number": 5285484, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6541 + } + }, + { + "ph": "s", "id": 116, "pid": 4183441, "tid": 4183441, "ts": 676007796289.669, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007796292.808, "dur": 4.538, + "args": { + "External id": 444319,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007796295.282, "dur": 1.802, + "args": { + "External id": 444320,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007796300.041, "dur": 92.830, + "args": { + "External id": 444321,"Sequence number": 5285485, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796302.052, "dur": 3.803, + "args": { + "External id": 444322,"Sequence number": 5285485, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796303.266, "dur": 2.457, + "args": { + "External id": 444323,"Sequence number": 5285485, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6546 + } + }, + { + "ph": "s", "id": 115, "pid": 4183441, "tid": 4183441, "ts": 676007796303.266, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007796307.033, "dur": 80.044, + "args": { + "External id": 444324,"Sequence number": 5285486, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6547 + } + }, + { + "ph": "s", "id": 114, "pid": 4183441, "tid": 4183441, "ts": 676007796307.033, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007796389.205, "dur": 2.884, + "args": { + "External id": 444325,"Sequence number": 5285487, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6548 + } + }, + { + "ph": "s", "id": 113, "pid": 4183441, "tid": 4183441, "ts": 676007796389.205, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007796425.417, "dur": 213.935, + "args": { + "External id": 444326,"Sequence number": 5285488, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6549 + } + }, + { + "ph": "s", "id": 112, "pid": 4183441, "tid": 4183441, "ts": 676007796425.417, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796446.066, "dur": 3.133, + "args": { + "External id": 444327,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796447.393, "dur": 1.666, + "args": { + "External id": 444328,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183441, "tid": 4183441, + "ts": 676007796454.119, "dur": 3.449, + "args": { + "External id": 444329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796455.579, "dur": 1.878, + "args": { + "External id": 444330,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796456.566, "dur": 0.762, + "args": { + "External id": 444331,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007796465.138, "dur": 6.963, + "args": { + "External id": 444332,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007796467.310, "dur": 4.459, + "args": { + "External id": 444333,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796478.411, "dur": 3.134, + "args": { + "External id": 444334,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796485.404, "dur": 3.336, + "args": { + "External id": 444335,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796617.532, "dur": 5.701, + "args": { + "External id": 444336,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796621.057, "dur": 1.879, + "args": { + "External id": 444337,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796625.731, "dur": 2.346, + "args": { + "External id": 444338,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796626.665, "dur": 1.291, + "args": { + "External id": 444339,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007796700.876, "dur": 123.382, + "args": { + "External id": 444340,"Sequence number": 5285489, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007796702.061, "dur": 10.274, + "args": { + "External id": 444341,"Sequence number": 5285489, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6564 + } + }, + { + "ph": "s", "id": 111, "pid": 4183441, "tid": 4183441, "ts": 676007796702.061, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007796705.092, "dur": 5.706, + "args": { + "External id": 444342,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007796708.101, "dur": 2.280, + "args": { + "External id": 444343,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007796713.558, "dur": 110.315, + "args": { + "External id": 444344,"Sequence number": 5285490, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796715.557, "dur": 5.660, + "args": { + "External id": 444345,"Sequence number": 5285490, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796716.337, "dur": 4.714, + "args": { + "External id": 444346,"Sequence number": 5285490, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6569 + } + }, + { + "ph": "s", "id": 110, "pid": 4183441, "tid": 4183441, "ts": 676007796716.337, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007796721.955, "dur": 75.090, + "args": { + "External id": 444347,"Sequence number": 5285491, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6570 + } + }, + { + "ph": "s", "id": 109, "pid": 4183441, "tid": 4183441, "ts": 676007796721.955, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007796814.769, "dur": 8.356, + "args": { + "External id": 444348,"Sequence number": 5285492, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6571 + } + }, + { + "ph": "s", "id": 108, "pid": 4183441, "tid": 4183441, "ts": 676007796814.769, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007796833.984, "dur": 67.190, + "args": { + "External id": 444349,"Sequence number": 5285493, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007796834.808, "dur": 7.567, + "args": { + "External id": 444350,"Sequence number": 5285493, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6573 + } + }, + { + "ph": "s", "id": 107, "pid": 4183441, "tid": 4183441, "ts": 676007796834.808, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007796837.091, "dur": 3.828, + "args": { + "External id": 444351,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007796839.105, "dur": 1.445, + "args": { + "External id": 444352,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007796843.140, "dur": 57.752, + "args": { + "External id": 444353,"Sequence number": 5285494, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007796844.816, "dur": 5.126, + "args": { + "External id": 444354,"Sequence number": 5285494, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007796845.904, "dur": 3.908, + "args": { + "External id": 444355,"Sequence number": 5285494, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6578 + } + }, + { + "ph": "s", "id": 106, "pid": 4183441, "tid": 4183441, "ts": 676007796845.904, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007796850.950, "dur": 45.590, + "args": { + "External id": 444356,"Sequence number": 5285495, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6579 + } + }, + { + "ph": "s", "id": 105, "pid": 4183441, "tid": 4183441, "ts": 676007796850.950, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007796898.339, "dur": 2.198, + "args": { + "External id": 444357,"Sequence number": 5285496, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6580 + } + }, + { + "ph": "s", "id": 104, "pid": 4183441, "tid": 4183441, "ts": 676007796898.339, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007796926.140, "dur": 146.326, + "args": { + "External id": 444358,"Sequence number": 5285497, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6581 + } + }, + { + "ph": "s", "id": 103, "pid": 4183441, "tid": 4183441, "ts": 676007796926.140, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007796965.800, "dur": 4.466, + "args": { + "External id": 444359,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007797000.769, "dur": 57.107, + "args": { + "External id": 444360,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007797001.437, "dur": 7.793, + "args": { + "External id": 444361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007797002.614, "dur": 5.532, + "args": { + "External id": 444362,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797007.250, "dur": 0.681, + "args": { + "External id": 444363,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007797010.108, "dur": 47.470, + "args": { + "External id": 444364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797011.818, "dur": 2.209, + "args": { + "External id": 444365,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797012.623, "dur": 1.283, + "args": { + "External id": 444366,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007797015.074, "dur": 39.090, + "args": { + "External id": 444367,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007797055.693, "dur": 1.177, + "args": { + "External id": 444368,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676007797081.046, "dur": 44.537, + "args": { + "External id": 444369,"Sequence number": 5285498, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6592 + } + }, + { + "ph": "s", "id": 102, "pid": 4183441, "tid": 4183441, "ts": 676007797081.046, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007797164.090, "dur": 190.964, + "args": { + "External id": 444370,"Sequence number": 5285499, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6593 + } + }, + { + "ph": "s", "id": 101, "pid": 4183441, "tid": 4183441, "ts": 676007797164.090, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797184.456, "dur": 4.208, + "args": { + "External id": 444371,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797185.821, "dur": 2.586, + "args": { + "External id": 444372,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007797196.969, "dur": 7.949, + "args": { + "External id": 444373,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797199.987, "dur": 4.517, + "args": { + "External id": 444374,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007797211.013, "dur": 3.873, + "args": { + "External id": 444375,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797340.239, "dur": 2.703, + "args": { + "External id": 444376,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797341.048, "dur": 1.697, + "args": { + "External id": 444377,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007797374.710, "dur": 92.125, + "args": { + "External id": 444378,"Sequence number": 5285500, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007797375.926, "dur": 8.161, + "args": { + "External id": 444379,"Sequence number": 5285500, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6602 + } + }, + { + "ph": "s", "id": 100, "pid": 4183441, "tid": 4183441, "ts": 676007797375.926, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007797378.706, "dur": 4.023, + "args": { + "External id": 444380,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797380.611, "dur": 1.967, + "args": { + "External id": 444381,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007797385.014, "dur": 81.582, + "args": { + "External id": 444382,"Sequence number": 5285501, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797386.664, "dur": 4.513, + "args": { + "External id": 444383,"Sequence number": 5285501, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797387.745, "dur": 3.280, + "args": { + "External id": 444384,"Sequence number": 5285501, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6607 + } + }, + { + "ph": "s", "id": 99, "pid": 4183441, "tid": 4183441, "ts": 676007797387.745, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007797391.992, "dur": 64.413, + "args": { + "External id": 444385,"Sequence number": 5285502, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6608 + } + }, + { + "ph": "s", "id": 98, "pid": 4183441, "tid": 4183441, "ts": 676007797391.992, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007797458.421, "dur": 7.390, + "args": { + "External id": 444386,"Sequence number": 5285503, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6609 + } + }, + { + "ph": "s", "id": 97, "pid": 4183441, "tid": 4183441, "ts": 676007797458.421, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007797474.457, "dur": 60.493, + "args": { + "External id": 444387,"Sequence number": 5285504, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007797475.073, "dur": 5.986, + "args": { + "External id": 444388,"Sequence number": 5285504, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6611 + } + }, + { + "ph": "s", "id": 96, "pid": 4183441, "tid": 4183441, "ts": 676007797475.073, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007797476.853, "dur": 2.922, + "args": { + "External id": 444389,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797478.589, "dur": 1.029, + "args": { + "External id": 444390,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007797481.701, "dur": 53.049, + "args": { + "External id": 444391,"Sequence number": 5285505, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797483.507, "dur": 3.580, + "args": { + "External id": 444392,"Sequence number": 5285505, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797484.716, "dur": 2.232, + "args": { + "External id": 444393,"Sequence number": 5285505, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6616 + } + }, + { + "ph": "s", "id": 95, "pid": 4183441, "tid": 4183441, "ts": 676007797484.716, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007797487.610, "dur": 42.534, + "args": { + "External id": 444394,"Sequence number": 5285506, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6617 + } + }, + { + "ph": "s", "id": 94, "pid": 4183441, "tid": 4183441, "ts": 676007797487.610, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007797532.112, "dur": 2.265, + "args": { + "External id": 444395,"Sequence number": 5285507, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6618 + } + }, + { + "ph": "s", "id": 93, "pid": 4183441, "tid": 4183441, "ts": 676007797532.112, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007797541.554, "dur": 56.974, + "args": { + "External id": 444396,"Sequence number": 5285508, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007797541.936, "dur": 6.581, + "args": { + "External id": 444397,"Sequence number": 5285508, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6620 + } + }, + { + "ph": "s", "id": 92, "pid": 4183441, "tid": 4183441, "ts": 676007797541.936, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007797543.842, "dur": 3.493, + "args": { + "External id": 444398,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797545.729, "dur": 1.408, + "args": { + "External id": 444399,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007797549.206, "dur": 49.142, + "args": { + "External id": 444400,"Sequence number": 5285509, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797550.544, "dur": 4.645, + "args": { + "External id": 444401,"Sequence number": 5285509, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797551.559, "dur": 3.480, + "args": { + "External id": 444402,"Sequence number": 5285509, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6625 + } + }, + { + "ph": "s", "id": 91, "pid": 4183441, "tid": 4183441, "ts": 676007797551.559, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007797555.903, "dur": 37.469, + "args": { + "External id": 444403,"Sequence number": 5285510, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6626 + } + }, + { + "ph": "s", "id": 90, "pid": 4183441, "tid": 4183441, "ts": 676007797555.903, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007797595.340, "dur": 2.664, + "args": { + "External id": 444404,"Sequence number": 5285511, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6627 + } + }, + { + "ph": "s", "id": 89, "pid": 4183441, "tid": 4183441, "ts": 676007797595.340, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797613.274, "dur": 4.656, + "args": { + "External id": 444405,"Sequence number": 5285512, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797614.584, "dur": 3.208, + "args": { + "External id": 444406,"Sequence number": 5285512, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6629 + } + }, + { + "ph": "s", "id": 88, "pid": 4183441, "tid": 4183441, "ts": 676007797614.584, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797624.209, "dur": 5.744, + "args": { + "External id": 444407,"Sequence number": 5285513, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797625.470, "dur": 4.327, + "args": { + "External id": 444408,"Sequence number": 5285513, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6631 + } + }, + { + "ph": "s", "id": 87, "pid": 4183441, "tid": 4183441, "ts": 676007797625.470, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007797633.922, "dur": 3.752, + "args": { + "External id": 444409,"Sequence number": 5285514, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007797635.118, "dur": 2.213, + "args": { + "External id": 444410,"Sequence number": 5285514, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6633 + } + }, + { + "ph": "s", "id": 86, "pid": 4183441, "tid": 4183441, "ts": 676007797635.118, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007797706.313, "dur": 161.709, + "args": { + "External id": 444411,"Sequence number": 5285515, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6634 + } + }, + { + "ph": "s", "id": 85, "pid": 4183441, "tid": 4183441, "ts": 676007797706.313, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007797728.043, "dur": 9.745, + "args": { + "External id": 444412,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797730.880, "dur": 6.250, + "args": { + "External id": 444413,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007797880.180, "dur": 104.122, + "args": { + "External id": 444414,"Sequence number": 5285516, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6637 + } + }, + { + "ph": "s", "id": 84, "pid": 4183441, "tid": 4183441, "ts": 676007797880.180, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007797893.310, "dur": 6.671, + "args": { + "External id": 444415,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007797895.436, "dur": 4.275, + "args": { + "External id": 444416,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183441, "tid": 4183441, + "ts": 676007798036.801, "dur": 206.109, + "args": { + "External id": 444417,"Sequence number": 5285517, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6640 + } + }, + { + "ph": "s", "id": 83, "pid": 4183441, "tid": 4183441, "ts": 676007798036.801, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007798064.093, "dur": 150.306, + "args": { + "External id": 444418,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007798131.663, "dur": 11.094, + "args": { + "External id": 444419,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798134.039, "dur": 7.745, + "args": { + "External id": 444420,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798147.986, "dur": 4.407, + "args": { + "External id": 444421,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798153.882, "dur": 1.450, + "args": { + "External id": 444422,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798157.920, "dur": 3.156, + "args": { + "External id": 444423,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 4183441, + "ts": 676007798226.971, "dur": 4.901, + "args": { + "External id": 444424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798247.681, "dur": 6.018, + "args": { + "External id": 444425,"Sequence number": 5285518, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798249.157, "dur": 4.393, + "args": { + "External id": 444426,"Sequence number": 5285518, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6649 + } + }, + { + "ph": "s", "id": 82, "pid": 4183441, "tid": 4183441, "ts": 676007798249.157, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007798267.768, "dur": 110.072, + "args": { + "External id": 444427,"Sequence number": 5285519, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007798269.276, "dur": 10.781, + "args": { + "External id": 444428,"Sequence number": 5285519, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6651 + } + }, + { + "ph": "s", "id": 81, "pid": 4183441, "tid": 4183441, "ts": 676007798269.276, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007798274.420, "dur": 4.433, + "args": { + "External id": 444429,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798277.003, "dur": 1.591, + "args": { + "External id": 444430,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007798281.941, "dur": 95.564, + "args": { + "External id": 444431,"Sequence number": 5285520, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798284.044, "dur": 3.237, + "args": { + "External id": 444432,"Sequence number": 5285520, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798285.074, "dur": 2.069, + "args": { + "External id": 444433,"Sequence number": 5285520, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6656 + } + }, + { + "ph": "s", "id": 80, "pid": 4183441, "tid": 4183441, "ts": 676007798285.074, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007798288.825, "dur": 79.575, + "args": { + "External id": 444434,"Sequence number": 5285521, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6657 + } + }, + { + "ph": "s", "id": 79, "pid": 4183441, "tid": 4183441, "ts": 676007798288.825, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007798370.596, "dur": 6.187, + "args": { + "External id": 444435,"Sequence number": 5285522, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6658 + } + }, + { + "ph": "s", "id": 78, "pid": 4183441, "tid": 4183441, "ts": 676007798370.596, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007798411.127, "dur": 199.006, + "args": { + "External id": 444436,"Sequence number": 5285523, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6659 + } + }, + { + "ph": "s", "id": 77, "pid": 4183441, "tid": 4183441, "ts": 676007798411.127, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798428.595, "dur": 2.800, + "args": { + "External id": 444437,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798429.743, "dur": 1.486, + "args": { + "External id": 444438,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183441, "tid": 4183441, + "ts": 676007798435.539, "dur": 3.805, + "args": { + "External id": 444439,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798436.839, "dur": 2.378, + "args": { + "External id": 444440,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798437.841, "dur": 1.263, + "args": { + "External id": 444441,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007798446.396, "dur": 6.995, + "args": { + "External id": 444442,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798448.646, "dur": 4.425, + "args": { + "External id": 444443,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798459.270, "dur": 3.160, + "args": { + "External id": 444444,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798466.013, "dur": 3.229, + "args": { + "External id": 444445,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798589.323, "dur": 3.331, + "args": { + "External id": 444446,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798590.341, "dur": 2.038, + "args": { + "External id": 444447,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798595.141, "dur": 2.189, + "args": { + "External id": 444448,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798596.227, "dur": 1.000, + "args": { + "External id": 444449,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007798626.250, "dur": 129.710, + "args": { + "External id": 444450,"Sequence number": 5285524, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007798627.302, "dur": 6.799, + "args": { + "External id": 444451,"Sequence number": 5285524, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6674 + } + }, + { + "ph": "s", "id": 76, "pid": 4183441, "tid": 4183441, "ts": 676007798627.302, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007798629.359, "dur": 3.506, + "args": { + "External id": 444452,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798631.292, "dur": 1.330, + "args": { + "External id": 444453,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007798635.214, "dur": 120.473, + "args": { + "External id": 444454,"Sequence number": 5285525, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798637.041, "dur": 3.188, + "args": { + "External id": 444455,"Sequence number": 5285525, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798638.047, "dur": 1.999, + "args": { + "External id": 444456,"Sequence number": 5285525, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6679 + } + }, + { + "ph": "s", "id": 75, "pid": 4183441, "tid": 4183441, "ts": 676007798638.047, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007798640.964, "dur": 104.933, + "args": { + "External id": 444457,"Sequence number": 5285526, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6680 + } + }, + { + "ph": "s", "id": 74, "pid": 4183441, "tid": 4183441, "ts": 676007798640.964, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007798749.490, "dur": 5.540, + "args": { + "External id": 444458,"Sequence number": 5285527, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6681 + } + }, + { + "ph": "s", "id": 73, "pid": 4183441, "tid": 4183441, "ts": 676007798749.490, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007798765.918, "dur": 68.350, + "args": { + "External id": 444459,"Sequence number": 5285528, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007798766.734, "dur": 7.176, + "args": { + "External id": 444460,"Sequence number": 5285528, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6683 + } + }, + { + "ph": "s", "id": 72, "pid": 4183441, "tid": 4183441, "ts": 676007798766.734, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007798768.720, "dur": 3.939, + "args": { + "External id": 444461,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798771.064, "dur": 1.402, + "args": { + "External id": 444462,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007798774.892, "dur": 59.176, + "args": { + "External id": 444463,"Sequence number": 5285529, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798776.472, "dur": 7.185, + "args": { + "External id": 444464,"Sequence number": 5285529, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798777.766, "dur": 5.701, + "args": { + "External id": 444465,"Sequence number": 5285529, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6688 + } + }, + { + "ph": "s", "id": 71, "pid": 4183441, "tid": 4183441, "ts": 676007798777.766, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007798784.184, "dur": 42.948, + "args": { + "External id": 444466,"Sequence number": 5285530, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6689 + } + }, + { + "ph": "s", "id": 70, "pid": 4183441, "tid": 4183441, "ts": 676007798784.184, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007798829.053, "dur": 4.634, + "args": { + "External id": 444467,"Sequence number": 5285531, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6690 + } + }, + { + "ph": "s", "id": 69, "pid": 4183441, "tid": 4183441, "ts": 676007798829.053, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007798855.167, "dur": 142.133, + "args": { + "External id": 444468,"Sequence number": 5285532, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6691 + } + }, + { + "ph": "s", "id": 68, "pid": 4183441, "tid": 4183441, "ts": 676007798855.167, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007798895.265, "dur": 4.327, + "args": { + "External id": 444469,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007798929.080, "dur": 54.894, + "args": { + "External id": 444470,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007798929.779, "dur": 4.879, + "args": { + "External id": 444471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007798930.707, "dur": 3.158, + "args": { + "External id": 444472,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007798932.740, "dur": 0.937, + "args": { + "External id": 444473,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007798935.313, "dur": 48.343, + "args": { + "External id": 444474,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007798936.892, "dur": 2.456, + "args": { + "External id": 444475,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007798938.224, "dur": 1.002, + "args": { + "External id": 444476,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007798940.291, "dur": 39.408, + "args": { + "External id": 444477,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007798981.474, "dur": 1.625, + "args": { + "External id": 444478,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676007799005.619, "dur": 23.919, + "args": { + "External id": 444479,"Sequence number": 5285533, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6702 + } + }, + { + "ph": "s", "id": 67, "pid": 4183441, "tid": 4183441, "ts": 676007799005.619, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007799062.953, "dur": 211.269, + "args": { + "External id": 444480,"Sequence number": 5285534, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [], [], [], [], []], "Ev Idx": 6703 + } + }, + { + "ph": "s", "id": 66, "pid": 4183441, "tid": 4183441, "ts": 676007799062.953, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799098.799, "dur": 4.640, + "args": { + "External id": 444481,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799100.284, "dur": 2.595, + "args": { + "External id": 444482,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007799112.146, "dur": 8.616, + "args": { + "External id": 444483,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799115.430, "dur": 4.937, + "args": { + "External id": 444484,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007799127.038, "dur": 3.624, + "args": { + "External id": 444485,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799257.825, "dur": 3.600, + "args": { + "External id": 444486,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799259.135, "dur": 2.085, + "args": { + "External id": 444487,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007799292.501, "dur": 93.804, + "args": { + "External id": 444488,"Sequence number": 5285535, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007799293.398, "dur": 7.302, + "args": { + "External id": 444489,"Sequence number": 5285535, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6712 + } + }, + { + "ph": "s", "id": 65, "pid": 4183441, "tid": 4183441, "ts": 676007799293.398, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007799295.753, "dur": 3.729, + "args": { + "External id": 444490,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799297.876, "dur": 1.410, + "args": { + "External id": 444491,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007799301.907, "dur": 84.164, + "args": { + "External id": 444492,"Sequence number": 5285536, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799303.622, "dur": 11.057, + "args": { + "External id": 444493,"Sequence number": 5285536, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799311.026, "dur": 3.522, + "args": { + "External id": 444494,"Sequence number": 5285536, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6717 + } + }, + { + "ph": "s", "id": 64, "pid": 4183441, "tid": 4183441, "ts": 676007799311.026, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007799315.797, "dur": 64.904, + "args": { + "External id": 444495,"Sequence number": 5285537, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6718 + } + }, + { + "ph": "s", "id": 63, "pid": 4183441, "tid": 4183441, "ts": 676007799315.797, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007799382.628, "dur": 2.824, + "args": { + "External id": 444496,"Sequence number": 5285538, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6719 + } + }, + { + "ph": "s", "id": 62, "pid": 4183441, "tid": 4183441, "ts": 676007799382.628, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007799394.721, "dur": 60.342, + "args": { + "External id": 444497,"Sequence number": 5285539, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007799395.419, "dur": 6.134, + "args": { + "External id": 444498,"Sequence number": 5285539, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6721 + } + }, + { + "ph": "s", "id": 61, "pid": 4183441, "tid": 4183441, "ts": 676007799395.419, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007799397.483, "dur": 2.918, + "args": { + "External id": 444499,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799399.583, "dur": 0.667, + "args": { + "External id": 444500,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007799402.358, "dur": 52.482, + "args": { + "External id": 444501,"Sequence number": 5285540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799403.635, "dur": 4.133, + "args": { + "External id": 444502,"Sequence number": 5285540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799404.681, "dur": 2.936, + "args": { + "External id": 444503,"Sequence number": 5285540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6726 + } + }, + { + "ph": "s", "id": 60, "pid": 4183441, "tid": 4183441, "ts": 676007799404.681, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007799408.239, "dur": 40.567, + "args": { + "External id": 444504,"Sequence number": 5285541, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6727 + } + }, + { + "ph": "s", "id": 59, "pid": 4183441, "tid": 4183441, "ts": 676007799408.239, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007799450.443, "dur": 4.090, + "args": { + "External id": 444505,"Sequence number": 5285542, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6728 + } + }, + { + "ph": "s", "id": 58, "pid": 4183441, "tid": 4183441, "ts": 676007799450.443, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007799462.396, "dur": 57.778, + "args": { + "External id": 444506,"Sequence number": 5285543, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007799462.885, "dur": 8.673, + "args": { + "External id": 444507,"Sequence number": 5285543, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6730 + } + }, + { + "ph": "s", "id": 57, "pid": 4183441, "tid": 4183441, "ts": 676007799462.885, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007799464.730, "dur": 5.522, + "args": { + "External id": 444508,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799466.917, "dur": 3.158, + "args": { + "External id": 444509,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007799472.321, "dur": 47.649, + "args": { + "External id": 444510,"Sequence number": 5285544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799473.411, "dur": 4.715, + "args": { + "External id": 444511,"Sequence number": 5285544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799474.311, "dur": 3.676, + "args": { + "External id": 444512,"Sequence number": 5285544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6735 + } + }, + { + "ph": "s", "id": 56, "pid": 4183441, "tid": 4183441, "ts": 676007799474.311, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007799478.719, "dur": 34.685, + "args": { + "External id": 444513,"Sequence number": 5285545, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6736 + } + }, + { + "ph": "s", "id": 55, "pid": 4183441, "tid": 4183441, "ts": 676007799478.719, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007799515.183, "dur": 4.447, + "args": { + "External id": 444514,"Sequence number": 5285546, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6737 + } + }, + { + "ph": "s", "id": 54, "pid": 4183441, "tid": 4183441, "ts": 676007799515.183, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799535.635, "dur": 3.195, + "args": { + "External id": 444515,"Sequence number": 5285547, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799536.268, "dur": 2.407, + "args": { + "External id": 444516,"Sequence number": 5285547, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6739 + } + }, + { + "ph": "s", "id": 53, "pid": 4183441, "tid": 4183441, "ts": 676007799536.268, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799545.060, "dur": 3.480, + "args": { + "External id": 444517,"Sequence number": 5285548, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799546.265, "dur": 2.133, + "args": { + "External id": 444518,"Sequence number": 5285548, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6741 + } + }, + { + "ph": "s", "id": 52, "pid": 4183441, "tid": 4183441, "ts": 676007799546.265, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007799552.715, "dur": 3.525, + "args": { + "External id": 444519,"Sequence number": 5285549, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007799554.250, "dur": 1.874, + "args": { + "External id": 444520,"Sequence number": 5285549, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 16, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6743 + } + }, + { + "ph": "s", "id": 51, "pid": 4183441, "tid": 4183441, "ts": 676007799554.250, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007799584.915, "dur": 193.419, + "args": { + "External id": 444521,"Sequence number": 5285550, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6744 + } + }, + { + "ph": "s", "id": 50, "pid": 4183441, "tid": 4183441, "ts": 676007799584.915, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007799602.526, "dur": 8.863, + "args": { + "External id": 444522,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799604.787, "dur": 6.077, + "args": { + "External id": 444523,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007799802.027, "dur": 106.960, + "args": { + "External id": 444524,"Sequence number": 5285551, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 6747 + } + }, + { + "ph": "s", "id": 49, "pid": 4183441, "tid": 4183441, "ts": 676007799802.027, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007799816.097, "dur": 8.546, + "args": { + "External id": 444525,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007799818.732, "dur": 5.539, + "args": { + "External id": 444526,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 4183441, "tid": 4183441, + "ts": 676007799936.144, "dur": 194.824, + "args": { + "External id": 444527,"Sequence number": 5285552, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 6750 + } + }, + { + "ph": "s", "id": 48, "pid": 4183441, "tid": 4183441, "ts": 676007799936.144, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007799962.304, "dur": 138.685, + "args": { + "External id": 444528,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [4194304, 1024, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [16, 4096, 16, 64], [16, 4096, 16, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007800010.994, "dur": 6.814, + "args": { + "External id": 444529,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[4194304, 1024, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 16, 64], [], [], [], [], []], "Ev Idx": 6752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800013.168, "dur": 4.146, + "args": { + "External id": 444530,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 16, 64]", "[4194304, 1024, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800020.652, "dur": 4.094, + "args": { + "External id": 444531,"Record function id": 0, "Concrete Inputs": ["[16, 16, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800026.116, "dur": 1.461, + "args": { + "External id": 444532,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800030.420, "dur": 4.767, + "args": { + "External id": 444533,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 4183441, "tid": 4183441, + "ts": 676007800114.902, "dur": 5.228, + "args": { + "External id": 444534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[4194304, 1024, 64, 1]], "Input Dims": [[16, 4096, 16, 64]], "Ev Idx": 6757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800136.098, "dur": 6.474, + "args": { + "External id": 444535,"Sequence number": 5285553, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800137.274, "dur": 5.166, + "args": { + "External id": 444536,"Sequence number": 5285553, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 64, 1], []], "Input Dims": [[16, 4096, 16, 64], []], "Ev Idx": 6759 + } + }, + { + "ph": "s", "id": 47, "pid": 4183441, "tid": 4183441, "ts": 676007800137.274, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007800155.085, "dur": 104.822, + "args": { + "External id": 444537,"Sequence number": 5285554, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [1024, 1024], []], "Ev Idx": 6760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007800156.118, "dur": 8.728, + "args": { + "External id": 444538,"Sequence number": 5285554, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[1024, 1024]], "Ev Idx": 6761 + } + }, + { + "ph": "s", "id": 46, "pid": 4183441, "tid": 4183441, "ts": 676007800156.118, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007800159.025, "dur": 4.690, + "args": { + "External id": 444539,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[1024, 1024], [], []], "Ev Idx": 6762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800161.893, "dur": 1.590, + "args": { + "External id": 444540,"Record function id": 0, "Concrete Inputs": ["", "[1024, 1024]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[1024, 1024], [], [], []], "Ev Idx": 6763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007800166.358, "dur": 93.231, + "args": { + "External id": 444541,"Sequence number": 5285555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 1024]], "Ev Idx": 6764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800168.459, "dur": 3.700, + "args": { + "External id": 444542,"Sequence number": 5285555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800169.579, "dur": 2.440, + "args": { + "External id": 444543,"Sequence number": 5285555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6766 + } + }, + { + "ph": "s", "id": 45, "pid": 4183441, "tid": 4183441, "ts": 676007800169.579, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007800173.525, "dur": 78.987, + "args": { + "External id": 444544,"Sequence number": 5285556, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 1024]], "Ev Idx": 6767 + } + }, + { + "ph": "s", "id": 44, "pid": 4183441, "tid": 4183441, "ts": 676007800173.525, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007800254.686, "dur": 4.131, + "args": { + "External id": 444545,"Sequence number": 5285557, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6768 + } + }, + { + "ph": "s", "id": 43, "pid": 4183441, "tid": 4183441, "ts": 676007800254.686, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007800292.811, "dur": 199.391, + "args": { + "External id": 444546,"Sequence number": 5285558, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4194304, 1024, 1], [1], [], [4194304, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [1024], [], [16, 4096, 1024], [], [], [], []], "Ev Idx": 6769 + } + }, + { + "ph": "s", "id": 42, "pid": 4183441, "tid": 4183441, "ts": 676007800292.811, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800311.145, "dur": 3.257, + "args": { + "External id": 444547,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800312.478, "dur": 1.785, + "args": { + "External id": 444548,"Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 4183441, "tid": 4183441, + "ts": 676007800318.395, "dur": 4.016, + "args": { + "External id": 444549,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1024, 1]], "Input Dims": [[16, 4096, 1024], [65536, 1024]], "Ev Idx": 6772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800319.720, "dur": 2.583, + "args": { + "External id": 444550,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800321.167, "dur": 1.030, + "args": { + "External id": 444551,"Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007800329.432, "dur": 7.411, + "args": { + "External id": 444552,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800331.745, "dur": 4.817, + "args": { + "External id": 444553,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800342.703, "dur": 3.974, + "args": { + "External id": 444554,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800350.323, "dur": 3.398, + "args": { + "External id": 444555,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800470.917, "dur": 5.288, + "args": { + "External id": 444556,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800471.996, "dur": 3.957, + "args": { + "External id": 444557,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800478.901, "dur": 2.923, + "args": { + "External id": 444558,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800480.395, "dur": 1.231, + "args": { + "External id": 444559,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007800508.778, "dur": 83.211, + "args": { + "External id": 444560,"Sequence number": 5285559, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007800509.993, "dur": 7.595, + "args": { + "External id": 444561,"Sequence number": 5285559, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6784 + } + }, + { + "ph": "s", "id": 41, "pid": 4183441, "tid": 4183441, "ts": 676007800509.993, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007800512.523, "dur": 3.859, + "args": { + "External id": 444562,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800515.023, "dur": 1.164, + "args": { + "External id": 444563,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007800518.392, "dur": 73.342, + "args": { + "External id": 444564,"Sequence number": 5285560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800520.107, "dur": 6.112, + "args": { + "External id": 444565,"Sequence number": 5285560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800521.008, "dur": 5.070, + "args": { + "External id": 444566,"Sequence number": 5285560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6789 + } + }, + { + "ph": "s", "id": 40, "pid": 4183441, "tid": 4183441, "ts": 676007800521.008, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007800527.341, "dur": 58.349, + "args": { + "External id": 444567,"Sequence number": 5285561, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6790 + } + }, + { + "ph": "s", "id": 39, "pid": 4183441, "tid": 4183441, "ts": 676007800527.341, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007800587.608, "dur": 3.631, + "args": { + "External id": 444568,"Sequence number": 5285562, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6791 + } + }, + { + "ph": "s", "id": 38, "pid": 4183441, "tid": 4183441, "ts": 676007800587.608, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007800598.887, "dur": 111.581, + "args": { + "External id": 444569,"Sequence number": 5285563, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[4194304, 1024, 1], [1024, 1], []], "Input Dims": [[16, 4096, 1024], [2816, 1024], []], "Ev Idx": 6792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007800599.543, "dur": 11.306, + "args": { + "External id": 444570,"Sequence number": 5285563, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[2816, 1024]], "Ev Idx": 6793 + } + }, + { + "ph": "s", "id": 37, "pid": 4183441, "tid": 4183441, "ts": 676007800599.543, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007800604.374, "dur": 5.138, + "args": { + "External id": 444571,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[2816, 1024], [], []], "Ev Idx": 6794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800608.541, "dur": 0.828, + "args": { + "External id": 444572,"Record function id": 0, "Concrete Inputs": ["", "[1024, 2816]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[2816, 1024], [], [], []], "Ev Idx": 6795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007800611.708, "dur": 98.533, + "args": { + "External id": 444573,"Sequence number": 5285564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[4194304, 1024, 1], [1, 1024]], "Input Dims": [[16, 4096, 1024], [1024, 2816]], "Ev Idx": 6796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800613.343, "dur": 5.515, + "args": { + "External id": 444574,"Sequence number": 5285564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800614.314, "dur": 4.382, + "args": { + "External id": 444575,"Sequence number": 5285564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6798 + } + }, + { + "ph": "s", "id": 36, "pid": 4183441, "tid": 4183441, "ts": 676007800614.314, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007800619.712, "dur": 80.480, + "args": { + "External id": 444576,"Sequence number": 5285565, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[65536, 1024], [1024, 2816]], "Ev Idx": 6799 + } + }, + { + "ph": "s", "id": 35, "pid": 4183441, "tid": 4183441, "ts": 676007800619.712, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007800702.956, "dur": 6.673, + "args": { + "External id": 444577,"Sequence number": 5285566, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2816, 1], []], "Input Dims": [[65536, 2816], []], "Ev Idx": 6800 + } + }, + { + "ph": "s", "id": 34, "pid": 4183441, "tid": 4183441, "ts": 676007800702.956, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007800733.469, "dur": 148.257, + "args": { + "External id": 444578,"Sequence number": 5285567, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6801 + } + }, + { + "ph": "s", "id": 33, "pid": 4183441, "tid": 4183441, "ts": 676007800733.469, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007800771.095, "dur": 5.156, + "args": { + "External id": 444579,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2816]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007800808.327, "dur": 60.797, + "args": { + "External id": 444580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[11534336, 2816, 1], [2816, 1], []], "Input Dims": [[16, 4096, 2816], [1024, 2816], []], "Ev Idx": 6803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007800809.217, "dur": 5.914, + "args": { + "External id": 444581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2816, 1]], "Input Dims": [[1024, 2816]], "Ev Idx": 6804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007800810.430, "dur": 3.807, + "args": { + "External id": 444582,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2816, 1], [], []], "Input Dims": [[1024, 2816], [], []], "Ev Idx": 6805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007800812.922, "dur": 1.163, + "args": { + "External id": 444583,"Record function id": 0, "Concrete Inputs": ["", "[2816, 1024]", "[1, 2816]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2816, 1], [], [], []], "Input Dims": [[1024, 2816], [], [], []], "Ev Idx": 6806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007800816.301, "dur": 52.468, + "args": { + "External id": 444584,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[11534336, 2816, 1], [1, 2816]], "Input Dims": [[16, 4096, 2816], [2816, 1024]], "Ev Idx": 6807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 4183441, "tid": 4183441, + "ts": 676007800818.029, "dur": 2.819, + "args": { + "External id": 444585,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800819.295, "dur": 1.442, + "args": { + "External id": 444586,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2816]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 2816, 1], []], "Input Dims": [[16, 4096, 2816], []], "Ev Idx": 6809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007800821.486, "dur": 43.597, + "args": { + "External id": 444587,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2816, 1], [1, 2816]], "Input Dims": [[65536, 2816], [2816, 1024]], "Ev Idx": 6810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 4183441, "tid": 4183441, + "ts": 676007800867.019, "dur": 1.164, + "args": { + "External id": 444588,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676007800889.610, "dur": 23.759, + "args": { + "External id": 444589,"Sequence number": 5285568, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4194304, 1024, 1], [4194304, 1024, 1], []], "Input Dims": [[16, 4096, 1024], [16, 4096, 1024], []], "Ev Idx": 6812 + } + }, + { + "ph": "s", "id": 32, "pid": 4183441, "tid": 4183441, "ts": 676007800889.610, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183441, "tid": 4183441, + "ts": 676007800931.465, "dur": 45.952, + "args": { + "External id": 444590,"Sequence number": 5285569, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "-2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1]], []], "Input Dims": [[[16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024]], []], "Ev Idx": 6813 + } + }, + { + "ph": "s", "id": 31, "pid": 4183441, "tid": 4183441, "ts": 676007800931.465, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 4183441, "tid": 4183441, + "ts": 676007800939.584, "dur": 32.813, + "args": { + "External id": 444591,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1], [4194304, 1024, 1]], []], "Input Dims": [[[16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024], [16, 4096, 1024]], []], "Ev Idx": 6814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007800974.462, "dur": 1.528, + "args": { + "External id": 444592,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 4096], []], "Ev Idx": 6815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 4183441, "tid": 4183441, + "ts": 676007801013.987, "dur": 49.054, + "args": { + "External id": 444593,"Record function id": 0, "Ev Idx": 6816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 2/0", "pid": 4183441, "tid": 4183441, + "ts": 676007801064.544, "dur": 221.089, + "args": { + "External id": 444594,"Record function id": 0, "Ev Idx": 6817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007801119.384, "dur": 157.805, + "args": { + "External id": 444595,"Sequence number": 5285570, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1], [16777216, 4096, 1024, 1]], "Input Dims": [[1024], [16, 4096, 4, 1024]], "Ev Idx": 6818 + } + }, + { + "ph": "s", "id": 30, "pid": 4183441, "tid": 4183441, "ts": 676007801119.384, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 4183441, "tid": 4183441, + "ts": 676007801193.540, "dur": 42.814, + "args": { + "External id": 444596,"kernel_hash": "cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "1024", "1", "9.9999999999999995e-07", "True", "1024", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/jo/cjoekcioom5xctcdduqst5tzkntyxxejg57p5veuuahm5owqtf73.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 1024], [262144, 1024], [1024], [262144], [], [], [], [], [], [], [], [], []], "Ev Idx": 6819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007801367.176, "dur": 40.919, + "args": { + "External id": 444597,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801370.006, "dur": 5.495, + "args": { + "External id": 444598,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801378.340, "dur": 29.455, + "args": { + "External id": 444599,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801381.948, "dur": 25.284, + "args": { + "External id": 444600,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007801412.202, "dur": 20.098, + "args": { + "External id": 444601,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801413.583, "dur": 2.997, + "args": { + "External id": 444602,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801417.488, "dur": 14.538, + "args": { + "External id": 444603,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801417.976, "dur": 13.622, + "args": { + "External id": 444604,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007801435.025, "dur": 21.726, + "args": { + "External id": 444605,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801435.853, "dur": 2.424, + "args": { + "External id": 444606,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801439.036, "dur": 17.473, + "args": { + "External id": 444607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801439.787, "dur": 16.155, + "args": { + "External id": 444608,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 6831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007801465.662, "dur": 0.766, + "args": { + "External id": 444609,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 6832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 4183441, "tid": 4183441, + "ts": 676007801473.955, "dur": 9.572, + "args": { + "External id": 444610,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "5", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 6833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801480.057, "dur": 2.023, + "args": { + "External id": 444611,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 6834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801489.701, "dur": 6.982, + "args": { + "External id": 444612,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801493.552, "dur": 1.250, + "args": { + "External id": 444613,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801497.796, "dur": 3.420, + "args": { + "External id": 444614,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801499.764, "dur": 0.740, + "args": { + "External id": 444615,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801502.681, "dur": 3.096, + "args": { + "External id": 444616,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 6839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801504.516, "dur": 0.705, + "args": { + "External id": 444617,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 6840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801508.983, "dur": 2.994, + "args": { + "External id": 444618,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 6841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801510.747, "dur": 0.665, + "args": { + "External id": 444619,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 6842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801513.049, "dur": 3.725, + "args": { + "External id": 444620,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 6843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801515.182, "dur": 0.738, + "args": { + "External id": 444621,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 6844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801517.775, "dur": 3.480, + "args": { + "External id": 444622,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4096, 4], [], [], [], []], "Ev Idx": 6845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801519.903, "dur": 0.822, + "args": { + "External id": 444623,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 6846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007801526.005, "dur": 5.842, + "args": { + "External id": 444624,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4096, 4], [], []], "Ev Idx": 6847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801530.433, "dur": 0.680, + "args": { + "External id": 444625,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 6848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801535.621, "dur": 3.212, + "args": { + "External id": 444626,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 6849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801537.527, "dur": 0.732, + "args": { + "External id": 444627,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 6850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007801542.252, "dur": 8.124, + "args": { + "External id": 444628,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 6851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801548.166, "dur": 0.957, + "args": { + "External id": 444629,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 6852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801551.371, "dur": 3.163, + "args": { + "External id": 444630,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 6853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801552.933, "dur": 1.066, + "args": { + "External id": 444631,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 6854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801556.909, "dur": 5.690, + "args": { + "External id": 444632,"Sequence number": 5285571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 6855 + } + }, + { + "ph": "s", "id": 29, "pid": 4183441, "tid": 4183441, "ts": 676007801556.909, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801560.217, "dur": 0.982, + "args": { + "External id": 444633,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801563.484, "dur": 4.908, + "args": { + "External id": 444634,"Sequence number": 5285572, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 6857 + } + }, + { + "ph": "s", "id": 28, "pid": 4183441, "tid": 4183441, "ts": 676007801563.484, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801567.069, "dur": 0.541, + "args": { + "External id": 444635,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007801569.305, "dur": 5.685, + "args": { + "External id": 444636,"Sequence number": 5285573, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 6859 + } + }, + { + "ph": "s", "id": 27, "pid": 4183441, "tid": 4183441, "ts": 676007801569.305, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801573.078, "dur": 1.085, + "args": { + "External id": 444637,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 6860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007801576.009, "dur": 4.247, + "args": { + "External id": 444638,"Sequence number": 5285574, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 6861 + } + }, + { + "ph": "s", "id": 26, "pid": 4183441, "tid": 4183441, "ts": 676007801576.009, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801578.675, "dur": 0.863, + "args": { + "External id": 444639,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 6862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007801584.478, "dur": 40.526, + "args": { + "External id": 444640,"Sequence number": 5285575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007801586.287, "dur": 38.478, + "args": { + "External id": 444641,"Sequence number": 5285575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801589.178, "dur": 8.178, + "args": { + "External id": 444642,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 6865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801591.440, "dur": 5.287, + "args": { + "External id": 444643,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007801599.111, "dur": 24.958, + "args": { + "External id": 444644,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 6867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007801650.194, "dur": 42.918, + "args": { + "External id": 444645,"Sequence number": 5285575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 6868 + } + }, + { + "ph": "s", "id": 25, "pid": 4183441, "tid": 4183441, "ts": 676007801650.194, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007801697.979, "dur": 1.849, + "args": { + "External id": 444646,"Sequence number": 5285576, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 6869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007801727.761, "dur": 21323.984, + "args": { + "External id": 444647,"Sequence number": 5285576, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 6870 + } + }, + { + "ph": "s", "id": 24, "pid": 4183441, "tid": 4183441, "ts": 676007801727.761, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007801742.481, "dur": 36.247, + "args": { + "External id": 444648,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007801743.177, "dur": 35.322, + "args": { + "External id": 444649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801745.151, "dur": 6.465, + "args": { + "External id": 444650,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801746.792, "dur": 4.403, + "args": { + "External id": 444651,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007801752.343, "dur": 25.658, + "args": { + "External id": 444652,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 6875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801794.665, "dur": 37.458, + "args": { + "External id": 444653,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801803.578, "dur": 7.891, + "args": { + "External id": 444654,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 6877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801806.892, "dur": 4.217, + "args": { + "External id": 444655,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801812.677, "dur": 19.222, + "args": { + "External id": 444656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 6879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801813.798, "dur": 17.734, + "args": { + "External id": 444657,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 6880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801835.895, "dur": 24.180, + "args": { + "External id": 444658,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 6881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007801836.750, "dur": 5.571, + "args": { + "External id": 444659,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 6882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801838.477, "dur": 3.579, + "args": { + "External id": 444660,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801842.899, "dur": 16.956, + "args": { + "External id": 444661,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801843.583, "dur": 15.854, + "args": { + "External id": 444662,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 6885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007801864.747, "dur": 17.487, + "args": { + "External id": 444663,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 6886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007801866.054, "dur": 3.000, + "args": { + "External id": 444664,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007801869.731, "dur": 12.223, + "args": { + "External id": 444665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 6888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007801870.573, "dur": 11.085, + "args": { + "External id": 444666,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 4183441, + "ts": 676007801889.009, "dur": 27.102, + "args": { + "External id": 444667,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007801920.367, "dur": 62.681, + "args": { + "External id": 444668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 6891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007801923.893, "dur": 58.596, + "args": { + "External id": 444669,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801930.297, "dur": 1.288, + "args": { + "External id": 444670,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 6893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007801933.177, "dur": 27.800, + "args": { + "External id": 444671,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007801937.297, "dur": 23.469, + "args": { + "External id": 444672,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 6895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007801940.056, "dur": 2.953, + "args": { + "External id": 444673,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007801943.864, "dur": 16.447, + "args": { + "External id": 444674,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 6897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676007801988.182, "dur": 15195.257, + "args": { + "External id": 444675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 6898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676007801989.898, "dur": 15192.665, + "args": { + "External id": 444676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 6899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007817195.688, "dur": 6.814, + "args": { + "External id": 444677,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817199.832, "dur": 1.037, + "args": { + "External id": 444678,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007817207.779, "dur": 112.623, + "args": { + "External id": 444679,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007817209.678, "dur": 6.999, + "args": { + "External id": 444680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007817212.072, "dur": 3.685, + "args": { + "External id": 444681,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817214.519, "dur": 1.013, + "args": { + "External id": 444682,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007817217.977, "dur": 101.439, + "args": { + "External id": 444683,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007817220.038, "dur": 98.498, + "args": { + "External id": 444684,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007817323.406, "dur": 4.083, + "args": { + "External id": 444685,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817325.351, "dur": 0.902, + "args": { + "External id": 444686,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007817336.622, "dur": 4.354, + "args": { + "External id": 444687,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 6910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007817352.246, "dur": 7.173, + "args": { + "External id": 444688,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 6911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007817355.488, "dur": 3.658, + "args": { + "External id": 444689,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007817500.314, "dur": 281.857, + "args": { + "External id": 444690,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007817504.018, "dur": 4.907, + "args": { + "External id": 444691,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007817511.425, "dur": 269.772, + "args": { + "External id": 444692,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 6915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007817514.676, "dur": 0.894, + "args": { + "External id": 444693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007817518.324, "dur": 29.978, + "args": { + "External id": 444694,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007817550.893, "dur": 6.620, + "args": { + "External id": 444695,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 6918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817556.409, "dur": 0.773, + "args": { + "External id": 444696,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 6919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007817559.706, "dur": 30.288, + "args": { + "External id": 444697,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007817561.224, "dur": 1.362, + "args": { + "External id": 444698,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007817565.557, "dur": 24.188, + "args": { + "External id": 444699,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 6922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007817570.539, "dur": 3.527, + "args": { + "External id": 444700,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007817592.245, "dur": 25.396, + "args": { + "External id": 444701,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007817621.034, "dur": 18.304, + "args": { + "External id": 444702,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007817643.324, "dur": 50.224, + "args": { + "External id": 444703,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 6926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007817696.799, "dur": 16.385, + "args": { + "External id": 444704,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007817716.719, "dur": 29.107, + "args": { + "External id": 444705,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 6928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007817719.571, "dur": 2.811, + "args": { + "External id": 444706,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817725.227, "dur": 3.049, + "args": { + "External id": 444707,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 6930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007817748.631, "dur": 16.528, + "args": { + "External id": 444708,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007817767.237, "dur": 12.823, + "args": { + "External id": 444709,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007817790.334, "dur": 2.654, + "args": { + "External id": 444710,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007817800.523, "dur": 4.642, + "args": { + "External id": 444711,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817803.056, "dur": 0.941, + "args": { + "External id": 444712,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007817892.686, "dur": 66.278, + "args": { + "External id": 444713,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 6936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007817964.831, "dur": 5.638, + "args": { + "External id": 444714,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007817968.217, "dur": 1.076, + "args": { + "External id": 444715,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007817972.277, "dur": 28.964, + "args": { + "External id": 444716,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 6939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007818007.007, "dur": 7.587, + "args": { + "External id": 444717,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 6940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007818009.181, "dur": 4.633, + "args": { + "External id": 444718,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 6941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818011.825, "dur": 1.754, + "args": { + "External id": 444719,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 6942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007818018.611, "dur": 53.893, + "args": { + "External id": 444720,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007818020.367, "dur": 51.602, + "args": { + "External id": 444721,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007818077.984, "dur": 36.418, + "args": { + "External id": 444722,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 6945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818122.303, "dur": 5.471, + "args": { + "External id": 444723,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818125.462, "dur": 1.239, + "args": { + "External id": 444724,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007818133.028, "dur": 64.751, + "args": { + "External id": 444725,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007818134.089, "dur": 13.774, + "args": { + "External id": 444726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007818135.354, "dur": 11.855, + "args": { + "External id": 444727,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818146.290, "dur": 0.730, + "args": { + "External id": 444728,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007818148.856, "dur": 48.419, + "args": { + "External id": 444729,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007818149.540, "dur": 47.141, + "args": { + "External id": 444730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818202.467, "dur": 4.351, + "args": { + "External id": 444731,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818204.728, "dur": 0.905, + "args": { + "External id": 444732,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007818214.031, "dur": 2.075, + "args": { + "External id": 444733,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 6956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007818224.535, "dur": 9.309, + "args": { + "External id": 444734,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 6957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007818226.882, "dur": 6.613, + "args": { + "External id": 444735,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007818332.477, "dur": 267.231, + "args": { + "External id": 444736,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007818334.697, "dur": 2.334, + "args": { + "External id": 444737,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007818338.688, "dur": 260.527, + "args": { + "External id": 444738,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 6961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007818341.075, "dur": 0.402, + "args": { + "External id": 444739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007818342.954, "dur": 32.351, + "args": { + "External id": 444740,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 6963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007818377.754, "dur": 3.191, + "args": { + "External id": 444741,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 6964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818379.827, "dur": 0.780, + "args": { + "External id": 444742,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 6965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007818382.710, "dur": 30.478, + "args": { + "External id": 444743,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007818384.190, "dur": 1.918, + "args": { + "External id": 444744,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007818387.657, "dur": 25.075, + "args": { + "External id": 444745,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 6968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007818392.911, "dur": 2.985, + "args": { + "External id": 444746,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007818414.957, "dur": 38.691, + "args": { + "External id": 444747,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007818455.765, "dur": 39.042, + "args": { + "External id": 444748,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007818497.934, "dur": 26.751, + "args": { + "External id": 444749,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 6972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007818526.468, "dur": 21.359, + "args": { + "External id": 444750,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 6973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007818549.964, "dur": 22.151, + "args": { + "External id": 444751,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 6974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007818551.872, "dur": 2.245, + "args": { + "External id": 444752,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 6975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818556.687, "dur": 0.962, + "args": { + "External id": 444753,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 6976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007818574.439, "dur": 11.612, + "args": { + "External id": 444754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 6977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007818587.398, "dur": 10.922, + "args": { + "External id": 444755,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 6978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007818605.795, "dur": 1.953, + "args": { + "External id": 444756,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 6979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818616.031, "dur": 3.408, + "args": { + "External id": 444757,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 6980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818618.048, "dur": 0.532, + "args": { + "External id": 444758,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 6981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007818741.958, "dur": 51.898, + "args": { + "External id": 444759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 6982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818799.404, "dur": 7.122, + "args": { + "External id": 444760,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818803.402, "dur": 1.585, + "args": { + "External id": 444761,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007818808.080, "dur": 25.476, + "args": { + "External id": 444762,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 6985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007818838.622, "dur": 12.576, + "args": { + "External id": 444763,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 6986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007818846.527, "dur": 3.988, + "args": { + "External id": 444764,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 6987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818849.090, "dur": 1.195, + "args": { + "External id": 444765,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 6988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007818854.014, "dur": 43.690, + "args": { + "External id": 444766,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007818855.762, "dur": 41.275, + "args": { + "External id": 444767,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 6990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007818901.432, "dur": 15.101, + "args": { + "External id": 444768,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 6991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818922.188, "dur": 4.486, + "args": { + "External id": 444769,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 6992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818924.852, "dur": 0.855, + "args": { + "External id": 444770,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 6993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007818931.130, "dur": 51.869, + "args": { + "External id": 444771,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 6994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007818932.063, "dur": 6.396, + "args": { + "External id": 444772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 6995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007818933.076, "dur": 4.765, + "args": { + "External id": 444773,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 6996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818934.686, "dur": 2.954, + "args": { + "External id": 444774,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 6997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007818939.728, "dur": 42.710, + "args": { + "External id": 444775,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007818940.706, "dur": 41.278, + "args": { + "External id": 444776,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 6999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007818987.543, "dur": 4.302, + "args": { + "External id": 444777,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007818989.724, "dur": 0.949, + "args": { + "External id": 444778,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007818998.345, "dur": 1.662, + "args": { + "External id": 444779,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819008.939, "dur": 6.158, + "args": { + "External id": 444780,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819011.076, "dur": 3.737, + "args": { + "External id": 444781,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007819124.840, "dur": 193.713, + "args": { + "External id": 444782,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819127.681, "dur": 3.345, + "args": { + "External id": 444783,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007819132.919, "dur": 185.100, + "args": { + "External id": 444784,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007819134.442, "dur": 0.346, + "args": { + "External id": 444785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007819139.261, "dur": 22.005, + "args": { + "External id": 444786,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007819163.265, "dur": 4.179, + "args": { + "External id": 444787,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819165.675, "dur": 1.471, + "args": { + "External id": 444788,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007819168.734, "dur": 24.133, + "args": { + "External id": 444789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819169.815, "dur": 3.360, + "args": { + "External id": 444790,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007819174.975, "dur": 17.542, + "args": { + "External id": 444791,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007819178.595, "dur": 2.706, + "args": { + "External id": 444792,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007819194.572, "dur": 20.642, + "args": { + "External id": 444793,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007819217.212, "dur": 18.739, + "args": { + "External id": 444794,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007819238.813, "dur": 16.849, + "args": { + "External id": 444795,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007819257.412, "dur": 11.749, + "args": { + "External id": 444796,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007819271.261, "dur": 20.208, + "args": { + "External id": 444797,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007819273.285, "dur": 1.644, + "args": { + "External id": 444798,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819277.523, "dur": 0.963, + "args": { + "External id": 444799,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007819293.380, "dur": 12.049, + "args": { + "External id": 444800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007819306.694, "dur": 10.226, + "args": { + "External id": 444801,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007819324.846, "dur": 2.080, + "args": { + "External id": 444802,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007819336.158, "dur": 3.834, + "args": { + "External id": 444803,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819338.667, "dur": 0.410, + "args": { + "External id": 444804,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007819407.529, "dur": 46.577, + "args": { + "External id": 444805,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007819459.358, "dur": 5.126, + "args": { + "External id": 444806,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819462.298, "dur": 0.918, + "args": { + "External id": 444807,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007819466.198, "dur": 24.986, + "args": { + "External id": 444808,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007819495.784, "dur": 7.305, + "args": { + "External id": 444809,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007819497.410, "dur": 4.989, + "args": { + "External id": 444810,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819499.632, "dur": 2.486, + "args": { + "External id": 444811,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007819505.924, "dur": 42.939, + "args": { + "External id": 444812,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007819507.296, "dur": 40.822, + "args": { + "External id": 444813,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007819552.973, "dur": 14.082, + "args": { + "External id": 444814,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007819572.294, "dur": 4.491, + "args": { + "External id": 444815,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819574.935, "dur": 0.966, + "args": { + "External id": 444816,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007819580.527, "dur": 47.701, + "args": { + "External id": 444817,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007819581.919, "dur": 3.946, + "args": { + "External id": 444818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007819582.631, "dur": 2.652, + "args": { + "External id": 444819,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819584.384, "dur": 0.754, + "args": { + "External id": 444820,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007819586.604, "dur": 41.290, + "args": { + "External id": 444821,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007819587.509, "dur": 39.745, + "args": { + "External id": 444822,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007819632.124, "dur": 3.757, + "args": { + "External id": 444823,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819634.000, "dur": 0.781, + "args": { + "External id": 444824,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007819641.486, "dur": 1.373, + "args": { + "External id": 444825,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819650.400, "dur": 46.579, + "args": { + "External id": 444826,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819690.927, "dur": 5.524, + "args": { + "External id": 444827,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007819795.042, "dur": 187.819, + "args": { + "External id": 444828,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819797.524, "dur": 2.651, + "args": { + "External id": 444829,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007819804.571, "dur": 177.824, + "args": { + "External id": 444830,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007819806.094, "dur": 0.291, + "args": { + "External id": 444831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007819807.884, "dur": 21.747, + "args": { + "External id": 444832,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007819831.415, "dur": 5.648, + "args": { + "External id": 444833,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819833.737, "dur": 2.808, + "args": { + "External id": 444834,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007819838.381, "dur": 22.769, + "args": { + "External id": 444835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007819839.524, "dur": 2.181, + "args": { + "External id": 444836,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007819843.230, "dur": 17.678, + "args": { + "External id": 444837,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007819846.435, "dur": 2.891, + "args": { + "External id": 444838,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007819863.182, "dur": 21.612, + "args": { + "External id": 444839,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007819886.374, "dur": 12.428, + "args": { + "External id": 444840,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007819902.400, "dur": 14.319, + "args": { + "External id": 444841,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007819918.323, "dur": 11.326, + "args": { + "External id": 444842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007819931.425, "dur": 22.411, + "args": { + "External id": 444843,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007819933.849, "dur": 1.984, + "args": { + "External id": 444844,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007819938.438, "dur": 2.772, + "args": { + "External id": 444845,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007819956.181, "dur": 11.521, + "args": { + "External id": 444846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007819968.772, "dur": 12.456, + "args": { + "External id": 444847,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007819989.103, "dur": 2.491, + "args": { + "External id": 444848,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820001.240, "dur": 4.396, + "args": { + "External id": 444849,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820003.807, "dur": 0.523, + "args": { + "External id": 444850,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820069.096, "dur": 67.630, + "args": { + "External id": 444851,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820143.195, "dur": 6.092, + "args": { + "External id": 444852,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820146.669, "dur": 1.225, + "args": { + "External id": 444853,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007820150.668, "dur": 26.449, + "args": { + "External id": 444854,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007820182.597, "dur": 6.573, + "args": { + "External id": 444855,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007820184.245, "dur": 4.185, + "args": { + "External id": 444856,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820186.410, "dur": 1.804, + "args": { + "External id": 444857,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007820192.461, "dur": 44.678, + "args": { + "External id": 444858,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820193.863, "dur": 42.577, + "args": { + "External id": 444859,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007820240.820, "dur": 16.528, + "args": { + "External id": 444860,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820262.845, "dur": 4.353, + "args": { + "External id": 444861,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820265.212, "dur": 1.087, + "args": { + "External id": 444862,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007820271.484, "dur": 48.280, + "args": { + "External id": 444863,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007820272.374, "dur": 4.494, + "args": { + "External id": 444864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007820273.514, "dur": 2.762, + "args": { + "External id": 444865,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820275.309, "dur": 0.816, + "args": { + "External id": 444866,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007820277.678, "dur": 41.726, + "args": { + "External id": 444867,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820278.633, "dur": 40.216, + "args": { + "External id": 444868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820323.675, "dur": 4.146, + "args": { + "External id": 444869,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820325.619, "dur": 0.961, + "args": { + "External id": 444870,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007820333.904, "dur": 1.591, + "args": { + "External id": 444871,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007820343.987, "dur": 7.150, + "args": { + "External id": 444872,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007820346.448, "dur": 4.372, + "args": { + "External id": 444873,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007820434.310, "dur": 189.062, + "args": { + "External id": 444874,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007820439.222, "dur": 2.064, + "args": { + "External id": 444875,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007820442.784, "dur": 180.106, + "args": { + "External id": 444876,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007820444.317, "dur": 0.373, + "args": { + "External id": 444877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007820445.950, "dur": 21.992, + "args": { + "External id": 444878,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007820469.591, "dur": 5.645, + "args": { + "External id": 444879,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820474.013, "dur": 0.910, + "args": { + "External id": 444880,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007820476.547, "dur": 22.391, + "args": { + "External id": 444881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007820477.904, "dur": 1.565, + "args": { + "External id": 444882,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007820480.982, "dur": 17.699, + "args": { + "External id": 444883,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007820483.839, "dur": 2.322, + "args": { + "External id": 444884,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007820500.332, "dur": 21.026, + "args": { + "External id": 444885,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007820523.002, "dur": 14.662, + "args": { + "External id": 444886,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007820540.341, "dur": 13.664, + "args": { + "External id": 444887,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007820555.978, "dur": 14.086, + "args": { + "External id": 444888,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007820571.976, "dur": 22.581, + "args": { + "External id": 444889,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007820576.065, "dur": 1.316, + "args": { + "External id": 444890,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820579.896, "dur": 0.620, + "args": { + "External id": 444891,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007820596.403, "dur": 13.700, + "args": { + "External id": 444892,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007820611.269, "dur": 10.590, + "args": { + "External id": 444893,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007820629.174, "dur": 1.630, + "args": { + "External id": 444894,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820687.382, "dur": 6.385, + "args": { + "External id": 444895,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820691.332, "dur": 0.863, + "args": { + "External id": 444896,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820767.203, "dur": 49.044, + "args": { + "External id": 444897,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820821.907, "dur": 5.229, + "args": { + "External id": 444898,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820825.049, "dur": 0.943, + "args": { + "External id": 444899,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007820828.815, "dur": 26.503, + "args": { + "External id": 444900,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007820859.698, "dur": 8.820, + "args": { + "External id": 444901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007820861.771, "dur": 6.078, + "args": { + "External id": 444902,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820864.091, "dur": 3.522, + "args": { + "External id": 444903,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007820871.596, "dur": 44.073, + "args": { + "External id": 444904,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820873.103, "dur": 41.849, + "args": { + "External id": 444905,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007820919.294, "dur": 15.506, + "args": { + "External id": 444906,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820939.564, "dur": 4.212, + "args": { + "External id": 444907,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820942.086, "dur": 0.846, + "args": { + "External id": 444908,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007820947.489, "dur": 48.381, + "args": { + "External id": 444909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007820948.478, "dur": 4.558, + "args": { + "External id": 444910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007820949.413, "dur": 3.078, + "args": { + "External id": 444911,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007820951.054, "dur": 1.293, + "args": { + "External id": 444912,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007820953.642, "dur": 41.897, + "args": { + "External id": 444913,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007820954.646, "dur": 40.180, + "args": { + "External id": 444914,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007820999.723, "dur": 3.860, + "args": { + "External id": 444915,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821001.717, "dur": 0.818, + "args": { + "External id": 444916,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007821009.602, "dur": 1.569, + "args": { + "External id": 444917,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821018.689, "dur": 6.539, + "args": { + "External id": 444918,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821020.680, "dur": 4.253, + "args": { + "External id": 444919,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007821127.573, "dur": 265.543, + "args": { + "External id": 444920,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821129.970, "dur": 2.907, + "args": { + "External id": 444921,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007821136.809, "dur": 255.816, + "args": { + "External id": 444922,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007821138.545, "dur": 0.427, + "args": { + "External id": 444923,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007821140.075, "dur": 41.836, + "args": { + "External id": 444924,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007821184.565, "dur": 6.207, + "args": { + "External id": 444925,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821186.750, "dur": 3.737, + "args": { + "External id": 444926,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007821192.513, "dur": 53.182, + "args": { + "External id": 444927,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821193.994, "dur": 2.166, + "args": { + "External id": 444928,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007821224.064, "dur": 21.369, + "args": { + "External id": 444929,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007821227.717, "dur": 2.784, + "args": { + "External id": 444930,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007821247.477, "dur": 27.566, + "args": { + "External id": 444931,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007821276.831, "dur": 26.159, + "args": { + "External id": 444932,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007821305.881, "dur": 16.287, + "args": { + "External id": 444933,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007821323.898, "dur": 12.998, + "args": { + "External id": 444934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007821338.900, "dur": 24.878, + "args": { + "External id": 444935,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007821343.321, "dur": 2.073, + "args": { + "External id": 444936,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821347.790, "dur": 0.868, + "args": { + "External id": 444937,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007821365.832, "dur": 12.913, + "args": { + "External id": 444938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007821380.076, "dur": 11.654, + "args": { + "External id": 444939,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007821400.871, "dur": 2.114, + "args": { + "External id": 444940,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007821412.489, "dur": 4.022, + "args": { + "External id": 444941,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821415.056, "dur": 0.483, + "args": { + "External id": 444942,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007821485.023, "dur": 48.642, + "args": { + "External id": 444943,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007821538.509, "dur": 4.782, + "args": { + "External id": 444944,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821541.180, "dur": 1.010, + "args": { + "External id": 444945,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007821544.772, "dur": 23.866, + "args": { + "External id": 444946,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007821572.770, "dur": 5.892, + "args": { + "External id": 444947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007821574.277, "dur": 3.747, + "args": { + "External id": 444948,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821576.413, "dur": 1.420, + "args": { + "External id": 444949,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007821581.645, "dur": 41.691, + "args": { + "External id": 444950,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007821582.695, "dur": 39.815, + "args": { + "External id": 444951,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007821627.006, "dur": 16.038, + "args": { + "External id": 444952,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007821648.133, "dur": 46.411, + "args": { + "External id": 444953,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821691.294, "dur": 1.465, + "args": { + "External id": 444954,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007821700.583, "dur": 56.564, + "args": { + "External id": 444955,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007821701.909, "dur": 5.400, + "args": { + "External id": 444956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007821703.241, "dur": 3.455, + "args": { + "External id": 444957,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821705.260, "dur": 1.295, + "args": { + "External id": 444958,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007821708.241, "dur": 48.538, + "args": { + "External id": 444959,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007821709.435, "dur": 46.777, + "args": { + "External id": 444960,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007821761.926, "dur": 3.809, + "args": { + "External id": 444961,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821764.074, "dur": 0.578, + "args": { + "External id": 444962,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007821772.843, "dur": 1.769, + "args": { + "External id": 444963,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821783.209, "dur": 6.239, + "args": { + "External id": 444964,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821785.498, "dur": 3.681, + "args": { + "External id": 444965,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007821871.818, "dur": 191.407, + "args": { + "External id": 444966,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821876.225, "dur": 2.388, + "args": { + "External id": 444967,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007821880.639, "dur": 182.016, + "args": { + "External id": 444968,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007821882.465, "dur": 0.383, + "args": { + "External id": 444969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007821884.439, "dur": 21.530, + "args": { + "External id": 444970,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007821907.935, "dur": 5.209, + "args": { + "External id": 444971,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007821911.904, "dur": 0.920, + "args": { + "External id": 444972,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007821914.444, "dur": 20.182, + "args": { + "External id": 444973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007821915.715, "dur": 1.388, + "args": { + "External id": 444974,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007821918.613, "dur": 15.750, + "args": { + "External id": 444975,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007821921.253, "dur": 2.458, + "args": { + "External id": 444976,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007821936.341, "dur": 20.356, + "args": { + "External id": 444977,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007821958.230, "dur": 16.139, + "args": { + "External id": 444978,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007821983.773, "dur": 17.640, + "args": { + "External id": 444979,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007822002.844, "dur": 12.498, + "args": { + "External id": 444980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007822017.418, "dur": 19.452, + "args": { + "External id": 444981,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007822019.587, "dur": 1.516, + "args": { + "External id": 444982,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822023.425, "dur": 1.265, + "args": { + "External id": 444983,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007822038.924, "dur": 11.172, + "args": { + "External id": 444984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007822051.499, "dur": 10.256, + "args": { + "External id": 444985,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007822069.153, "dur": 1.730, + "args": { + "External id": 444986,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822079.254, "dur": 20.483, + "args": { + "External id": 444987,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822097.243, "dur": 0.876, + "args": { + "External id": 444988,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007822167.569, "dur": 44.098, + "args": { + "External id": 444989,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822216.700, "dur": 4.890, + "args": { + "External id": 444990,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822219.570, "dur": 0.912, + "args": { + "External id": 444991,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007822223.034, "dur": 22.016, + "args": { + "External id": 444992,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007822249.230, "dur": 8.368, + "args": { + "External id": 444993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007822251.154, "dur": 5.818, + "args": { + "External id": 444994,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822253.292, "dur": 3.469, + "args": { + "External id": 444995,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007822260.602, "dur": 39.475, + "args": { + "External id": 444996,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007822261.797, "dur": 37.421, + "args": { + "External id": 444997,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007822303.960, "dur": 14.494, + "args": { + "External id": 444998,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822323.259, "dur": 4.371, + "args": { + "External id": 444999,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822325.716, "dur": 0.991, + "args": { + "External id": 445000,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007822331.395, "dur": 46.158, + "args": { + "External id": 445001,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007822332.414, "dur": 4.449, + "args": { + "External id": 445002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007822333.326, "dur": 2.890, + "args": { + "External id": 445003,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822335.286, "dur": 0.806, + "args": { + "External id": 445004,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007822337.594, "dur": 39.636, + "args": { + "External id": 445005,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007822338.593, "dur": 38.072, + "args": { + "External id": 445006,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822381.456, "dur": 3.571, + "args": { + "External id": 445007,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822383.498, "dur": 0.538, + "args": { + "External id": 445008,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007822390.846, "dur": 1.478, + "args": { + "External id": 445009,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007822399.416, "dur": 6.682, + "args": { + "External id": 445010,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007822401.523, "dur": 4.298, + "args": { + "External id": 445011,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007822477.625, "dur": 173.404, + "args": { + "External id": 445012,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007822479.658, "dur": 2.283, + "args": { + "External id": 445013,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007822485.971, "dur": 164.639, + "args": { + "External id": 445014,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007822487.069, "dur": 0.539, + "args": { + "External id": 445015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007822488.846, "dur": 19.984, + "args": { + "External id": 445016,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007822510.430, "dur": 5.345, + "args": { + "External id": 445017,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822512.151, "dur": 3.359, + "args": { + "External id": 445018,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007822517.192, "dur": 22.384, + "args": { + "External id": 445019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007822518.516, "dur": 1.413, + "args": { + "External id": 445020,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007822521.445, "dur": 17.867, + "args": { + "External id": 445021,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007822523.968, "dur": 2.293, + "args": { + "External id": 445022,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007822541.142, "dur": 19.848, + "args": { + "External id": 445023,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007822562.127, "dur": 12.774, + "args": { + "External id": 445024,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007822578.081, "dur": 12.446, + "args": { + "External id": 445025,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007822591.892, "dur": 10.793, + "args": { + "External id": 445026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007822604.443, "dur": 20.931, + "args": { + "External id": 445027,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007822606.191, "dur": 2.093, + "args": { + "External id": 445028,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822610.668, "dur": 2.606, + "args": { + "External id": 445029,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007822626.983, "dur": 11.028, + "args": { + "External id": 445030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007822639.209, "dur": 10.406, + "args": { + "External id": 445031,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007822694.392, "dur": 2.502, + "args": { + "External id": 445032,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822706.919, "dur": 3.757, + "args": { + "External id": 445033,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822709.192, "dur": 0.493, + "args": { + "External id": 445034,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007822780.041, "dur": 47.739, + "args": { + "External id": 445035,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007822832.096, "dur": 4.996, + "args": { + "External id": 445036,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822835.031, "dur": 0.948, + "args": { + "External id": 445037,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007822838.163, "dur": 26.251, + "args": { + "External id": 445038,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007822868.536, "dur": 6.445, + "args": { + "External id": 445039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007822870.169, "dur": 4.126, + "args": { + "External id": 445040,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822872.288, "dur": 1.731, + "args": { + "External id": 445041,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007822877.224, "dur": 42.465, + "args": { + "External id": 445042,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007822879.055, "dur": 40.002, + "args": { + "External id": 445043,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007822923.391, "dur": 14.972, + "args": { + "External id": 445044,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007822943.425, "dur": 25.065, + "args": { + "External id": 445045,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007822946.108, "dur": 21.989, + "args": { + "External id": 445046,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822951.676, "dur": 1.336, + "args": { + "External id": 445047,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007822974.460, "dur": 27.454, + "args": { + "External id": 445048,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007822976.537, "dur": 25.155, + "args": { + "External id": 445049,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 7272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007822982.163, "dur": 4.122, + "args": { + "External id": 445050,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007822987.502, "dur": 13.726, + "args": { + "External id": 445051,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007823017.387, "dur": 6.526, + "args": { + "External id": 445052,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007823020.220, "dur": 3.379, + "args": { + "External id": 445053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007823024.861, "dur": 1.698, + "args": { + "External id": 445054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007823025.968, "dur": 0.516, + "args": { + "External id": 445055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007823070.648, "dur": 41.671, + "args": { + "External id": 445056,"Sequence number": 5285577, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7279 + } + }, + { + "ph": "s", "id": 23, "pid": 4183441, "tid": 4183441, "ts": 676007823070.648, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007823119.689, "dur": 7.199, + "args": { + "External id": 445057,"Sequence number": 5285578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 7280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823123.692, "dur": 1.616, + "args": { + "External id": 445058,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007823129.470, "dur": 6.357, + "args": { + "External id": 445059,"Sequence number": 5285578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "1"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 7282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823133.825, "dur": 0.902, + "args": { + "External id": 445060,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007823137.070, "dur": 2.737, + "args": { + "External id": 445061,"Sequence number": 5285578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 7284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823138.760, "dur": 0.498, + "args": { + "External id": 445062,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 7285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007823144.071, "dur": 6.882, + "args": { + "External id": 445063,"Sequence number": 5285578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7286 + } + }, + { + "ph": "s", "id": 22, "pid": 4183441, "tid": 4183441, "ts": 676007823144.071, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823148.010, "dur": 1.427, + "args": { + "External id": 445064,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007823151.916, "dur": 5.303, + "args": { + "External id": 445065,"Sequence number": 5285579, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7288 + } + }, + { + "ph": "s", "id": 21, "pid": 4183441, "tid": 4183441, "ts": 676007823151.916, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823155.574, "dur": 0.865, + "args": { + "External id": 445066,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007823158.584, "dur": 5.666, + "args": { + "External id": 445067,"Sequence number": 5285580, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 7290 + } + }, + { + "ph": "s", "id": 20, "pid": 4183441, "tid": 4183441, "ts": 676007823158.584, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823162.564, "dur": 0.566, + "args": { + "External id": 445068,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007823165.277, "dur": 4.748, + "args": { + "External id": 445069,"Sequence number": 5285581, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 7292 + } + }, + { + "ph": "s", "id": 19, "pid": 4183441, "tid": 4183441, "ts": 676007823165.277, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823168.151, "dur": 1.116, + "args": { + "External id": 445070,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "1024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 7293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007823174.561, "dur": 31.795, + "args": { + "External id": 445071,"Sequence number": 5285582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007823176.229, "dur": 29.917, + "args": { + "External id": 445072,"Sequence number": 5285582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823179.107, "dur": 7.732, + "args": { + "External id": 445073,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 7296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007823181.547, "dur": 4.741, + "args": { + "External id": 445074,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007823188.222, "dur": 17.492, + "args": { + "External id": 445075,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 7298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007823233.617, "dur": 5.938, + "args": { + "External id": 445076,"Sequence number": 5285582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 7299 + } + }, + { + "ph": "s", "id": 18, "pid": 4183441, "tid": 4183441, "ts": 676007823233.617, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007823242.043, "dur": 0.911, + "args": { + "External id": 445077,"Sequence number": 5285583, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007823275.100, "dur": 22316.244, + "args": { + "External id": 445078,"Sequence number": 5285583, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 7301 + } + }, + { + "ph": "s", "id": 17, "pid": 4183441, "tid": 4183441, "ts": 676007823275.100, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007823290.102, "dur": 24.209, + "args": { + "External id": 445079,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007823290.888, "dur": 23.202, + "args": { + "External id": 445080,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823292.150, "dur": 5.388, + "args": { + "External id": 445081,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007823293.525, "dur": 3.633, + "args": { + "External id": 445082,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007823298.278, "dur": 15.359, + "args": { + "External id": 445083,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 7306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823329.089, "dur": 24.695, + "args": { + "External id": 445084,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823330.002, "dur": 6.188, + "args": { + "External id": 445085,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823332.394, "dur": 3.442, + "args": { + "External id": 445086,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007823337.651, "dur": 15.926, + "args": { + "External id": 445087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007823339.534, "dur": 13.646, + "args": { + "External id": 445088,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823357.206, "dur": 20.529, + "args": { + "External id": 445089,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007823357.991, "dur": 5.802, + "args": { + "External id": 445090,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823360.123, "dur": 3.420, + "args": { + "External id": 445091,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007823364.504, "dur": 13.032, + "args": { + "External id": 445092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007823365.503, "dur": 11.670, + "args": { + "External id": 445093,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 7316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007823383.613, "dur": 20.292, + "args": { + "External id": 445094,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 7317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007823388.078, "dur": 3.239, + "args": { + "External id": 445095,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007823391.938, "dur": 11.713, + "args": { + "External id": 445096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 7319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007823392.691, "dur": 10.589, + "args": { + "External id": 445097,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 4183441, + "ts": 676007823409.055, "dur": 22.217, + "args": { + "External id": 445098,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007823434.019, "dur": 49.233, + "args": { + "External id": 445099,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007823435.725, "dur": 47.055, + "args": { + "External id": 445100,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823439.727, "dur": 1.132, + "args": { + "External id": 445101,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007823442.015, "dur": 24.065, + "args": { + "External id": 445102,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007823443.670, "dur": 22.202, + "args": { + "External id": 445103,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 7326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007823447.975, "dur": 2.938, + "args": { + "External id": 445104,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007823451.611, "dur": 13.888, + "args": { + "External id": 445105,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 7328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676007823487.163, "dur": 16369.355, + "args": { + "External id": 445106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676007823488.629, "dur": 16364.467, + "args": { + "External id": 445107,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007839875.801, "dur": 10.906, + "args": { + "External id": 445108,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007839882.343, "dur": 1.753, + "args": { + "External id": 445109,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007839892.747, "dur": 117.068, + "args": { + "External id": 445110,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007839894.803, "dur": 7.757, + "args": { + "External id": 445111,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007839897.487, "dur": 4.217, + "args": { + "External id": 445112,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007839900.045, "dur": 1.366, + "args": { + "External id": 445113,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007839903.788, "dur": 105.195, + "args": { + "External id": 445114,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007839906.097, "dur": 102.038, + "args": { + "External id": 445115,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007840013.770, "dur": 4.317, + "args": { + "External id": 445116,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840015.724, "dur": 0.883, + "args": { + "External id": 445117,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007840027.744, "dur": 3.293, + "args": { + "External id": 445118,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840043.432, "dur": 8.234, + "args": { + "External id": 445119,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840046.292, "dur": 5.076, + "args": { + "External id": 445120,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007840194.005, "dur": 235.682, + "args": { + "External id": 445121,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840197.537, "dur": 3.094, + "args": { + "External id": 445122,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007840204.707, "dur": 224.421, + "args": { + "External id": 445123,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007840207.062, "dur": 0.643, + "args": { + "External id": 445124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007840209.309, "dur": 29.480, + "args": { + "External id": 445125,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007840241.306, "dur": 6.038, + "args": { + "External id": 445126,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840243.911, "dur": 3.046, + "args": { + "External id": 445127,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007840248.730, "dur": 40.545, + "args": { + "External id": 445128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840263.217, "dur": 1.582, + "args": { + "External id": 445129,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007840266.782, "dur": 22.158, + "args": { + "External id": 445130,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007840271.920, "dur": 3.295, + "args": { + "External id": 445131,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007840291.235, "dur": 24.855, + "args": { + "External id": 445132,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007840318.034, "dur": 19.590, + "args": { + "External id": 445133,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007840341.103, "dur": 16.655, + "args": { + "External id": 445134,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007840359.707, "dur": 14.735, + "args": { + "External id": 445135,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007840376.685, "dur": 22.683, + "args": { + "External id": 445136,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007840378.849, "dur": 1.752, + "args": { + "External id": 445137,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840383.530, "dur": 1.001, + "args": { + "External id": 445138,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007840401.389, "dur": 13.331, + "args": { + "External id": 445139,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007840416.528, "dur": 11.666, + "args": { + "External id": 445140,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007840437.374, "dur": 2.601, + "args": { + "External id": 445141,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007840447.554, "dur": 4.787, + "args": { + "External id": 445142,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840450.532, "dur": 0.868, + "args": { + "External id": 445143,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007840522.347, "dur": 58.905, + "args": { + "External id": 445144,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007840586.365, "dur": 7.039, + "args": { + "External id": 445145,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840589.169, "dur": 1.399, + "args": { + "External id": 445146,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007840594.955, "dur": 26.760, + "args": { + "External id": 445147,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007840626.406, "dur": 7.856, + "args": { + "External id": 445148,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007840628.870, "dur": 4.575, + "args": { + "External id": 445149,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840631.556, "dur": 1.626, + "args": { + "External id": 445150,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007840637.269, "dur": 87.320, + "args": { + "External id": 445151,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007840638.895, "dur": 84.236, + "args": { + "External id": 445152,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007840730.635, "dur": 18.930, + "args": { + "External id": 445153,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007840756.135, "dur": 4.817, + "args": { + "External id": 445154,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840758.900, "dur": 0.932, + "args": { + "External id": 445155,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007840765.883, "dur": 54.028, + "args": { + "External id": 445156,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007840767.059, "dur": 4.781, + "args": { + "External id": 445157,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007840768.245, "dur": 3.008, + "args": { + "External id": 445158,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840770.227, "dur": 0.847, + "args": { + "External id": 445159,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007840773.041, "dur": 46.530, + "args": { + "External id": 445160,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007840774.124, "dur": 45.027, + "args": { + "External id": 445161,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007840824.091, "dur": 4.127, + "args": { + "External id": 445162,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840825.972, "dur": 0.971, + "args": { + "External id": 445163,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007840834.972, "dur": 2.279, + "args": { + "External id": 445164,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840846.117, "dur": 8.556, + "args": { + "External id": 445165,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840848.777, "dur": 5.573, + "args": { + "External id": 445166,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007840946.534, "dur": 331.005, + "args": { + "External id": 445167,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840948.519, "dur": 1.961, + "args": { + "External id": 445168,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007840952.254, "dur": 324.791, + "args": { + "External id": 445169,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007840954.401, "dur": 0.466, + "args": { + "External id": 445170,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007840956.392, "dur": 24.742, + "args": { + "External id": 445171,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007840983.062, "dur": 3.447, + "args": { + "External id": 445172,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007840985.169, "dur": 0.828, + "args": { + "External id": 445173,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007840987.869, "dur": 26.438, + "args": { + "External id": 445174,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007840989.139, "dur": 1.710, + "args": { + "External id": 445175,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007840992.423, "dur": 21.603, + "args": { + "External id": 445176,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007840997.546, "dur": 2.823, + "args": { + "External id": 445177,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007841015.883, "dur": 26.277, + "args": { + "External id": 445178,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007841043.771, "dur": 52.965, + "args": { + "External id": 445179,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007841100.970, "dur": 34.614, + "args": { + "External id": 445180,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007841137.193, "dur": 41.662, + "args": { + "External id": 445181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007841181.071, "dur": 40.371, + "args": { + "External id": 445182,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007841183.579, "dur": 2.203, + "args": { + "External id": 445183,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841188.630, "dur": 0.849, + "args": { + "External id": 445184,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007841223.579, "dur": 25.839, + "args": { + "External id": 445185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007841250.590, "dur": 25.512, + "args": { + "External id": 445186,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007841284.989, "dur": 2.481, + "args": { + "External id": 445187,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007841296.625, "dur": 3.880, + "args": { + "External id": 445188,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841299.106, "dur": 0.612, + "args": { + "External id": 445189,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007841368.028, "dur": 48.603, + "args": { + "External id": 445190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007841421.364, "dur": 5.772, + "args": { + "External id": 445191,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841424.713, "dur": 1.444, + "args": { + "External id": 445192,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007841428.399, "dur": 23.158, + "args": { + "External id": 445193,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007841456.206, "dur": 5.905, + "args": { + "External id": 445194,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007841457.862, "dur": 3.549, + "args": { + "External id": 445195,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841460.190, "dur": 1.036, + "args": { + "External id": 445196,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007841464.667, "dur": 41.563, + "args": { + "External id": 445197,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007841466.035, "dur": 39.660, + "args": { + "External id": 445198,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007841509.655, "dur": 13.383, + "args": { + "External id": 445199,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007841528.049, "dur": 4.548, + "args": { + "External id": 445200,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841530.724, "dur": 1.093, + "args": { + "External id": 445201,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007841536.460, "dur": 65.093, + "args": { + "External id": 445202,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007841537.667, "dur": 6.441, + "args": { + "External id": 445203,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007841538.805, "dur": 4.749, + "args": { + "External id": 445204,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841540.757, "dur": 2.573, + "args": { + "External id": 445205,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007841558.709, "dur": 42.390, + "args": { + "External id": 445206,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007841559.622, "dur": 40.953, + "args": { + "External id": 445207,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007841605.444, "dur": 4.364, + "args": { + "External id": 445208,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841607.701, "dur": 0.931, + "args": { + "External id": 445209,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007841614.966, "dur": 1.852, + "args": { + "External id": 445210,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007841625.225, "dur": 6.366, + "args": { + "External id": 445211,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007841627.165, "dur": 4.158, + "args": { + "External id": 445212,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007841754.078, "dur": 194.675, + "args": { + "External id": 445213,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007841758.906, "dur": 3.156, + "args": { + "External id": 445214,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007841763.755, "dur": 184.532, + "args": { + "External id": 445215,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007841765.764, "dur": 0.625, + "args": { + "External id": 445216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007841768.133, "dur": 21.399, + "args": { + "External id": 445217,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007841791.168, "dur": 5.784, + "args": { + "External id": 445218,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841795.563, "dur": 1.085, + "args": { + "External id": 445219,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007841797.935, "dur": 24.518, + "args": { + "External id": 445220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007841799.365, "dur": 1.580, + "args": { + "External id": 445221,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007841802.722, "dur": 19.378, + "args": { + "External id": 445222,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007841805.970, "dur": 2.738, + "args": { + "External id": 445223,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007841824.117, "dur": 20.883, + "args": { + "External id": 445224,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007841846.364, "dur": 17.393, + "args": { + "External id": 445225,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007841866.525, "dur": 14.685, + "args": { + "External id": 445226,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007841882.876, "dur": 13.411, + "args": { + "External id": 445227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007841898.258, "dur": 22.533, + "args": { + "External id": 445228,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007841900.563, "dur": 1.821, + "args": { + "External id": 445229,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841905.033, "dur": 1.016, + "args": { + "External id": 445230,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007841922.655, "dur": 12.554, + "args": { + "External id": 445231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007841936.414, "dur": 10.893, + "args": { + "External id": 445232,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007841959.069, "dur": 2.310, + "args": { + "External id": 445233,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007841970.839, "dur": 3.800, + "args": { + "External id": 445234,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007841973.629, "dur": 0.371, + "args": { + "External id": 445235,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842037.160, "dur": 62.588, + "args": { + "External id": 445236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842106.379, "dur": 5.926, + "args": { + "External id": 445237,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842109.914, "dur": 0.957, + "args": { + "External id": 445238,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007842113.671, "dur": 26.733, + "args": { + "External id": 445239,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007842145.559, "dur": 7.870, + "args": { + "External id": 445240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007842147.042, "dur": 5.613, + "args": { + "External id": 445241,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842149.314, "dur": 3.098, + "args": { + "External id": 445242,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007842156.784, "dur": 47.852, + "args": { + "External id": 445243,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842158.003, "dur": 45.977, + "args": { + "External id": 445244,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007842208.632, "dur": 16.717, + "args": { + "External id": 445245,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842230.882, "dur": 3.816, + "args": { + "External id": 445246,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842233.203, "dur": 0.757, + "args": { + "External id": 445247,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007842238.734, "dur": 48.073, + "args": { + "External id": 445248,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007842239.924, "dur": 4.274, + "args": { + "External id": 445249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007842240.923, "dur": 2.684, + "args": { + "External id": 445250,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842242.938, "dur": 0.536, + "args": { + "External id": 445251,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007842244.764, "dur": 41.668, + "args": { + "External id": 445252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842245.630, "dur": 40.304, + "args": { + "External id": 445253,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842290.862, "dur": 4.193, + "args": { + "External id": 445254,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842292.934, "dur": 1.076, + "args": { + "External id": 445255,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007842300.747, "dur": 1.804, + "args": { + "External id": 445256,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842310.389, "dur": 7.243, + "args": { + "External id": 445257,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842312.707, "dur": 4.671, + "args": { + "External id": 445258,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007842402.566, "dur": 191.404, + "args": { + "External id": 445259,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842404.954, "dur": 2.378, + "args": { + "External id": 445260,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007842411.251, "dur": 182.155, + "args": { + "External id": 445261,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007842412.954, "dur": 0.575, + "args": { + "External id": 445262,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007842415.395, "dur": 22.042, + "args": { + "External id": 445263,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007842438.992, "dur": 6.089, + "args": { + "External id": 445264,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842441.712, "dur": 2.932, + "args": { + "External id": 445265,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007842446.061, "dur": 23.377, + "args": { + "External id": 445266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842447.253, "dur": 1.648, + "args": { + "External id": 445267,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007842450.418, "dur": 18.721, + "args": { + "External id": 445268,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007842453.283, "dur": 3.156, + "args": { + "External id": 445269,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007842471.110, "dur": 21.187, + "args": { + "External id": 445270,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007842493.496, "dur": 13.728, + "args": { + "External id": 445271,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007842510.141, "dur": 14.811, + "args": { + "External id": 445272,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007842526.278, "dur": 13.602, + "args": { + "External id": 445273,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007842541.877, "dur": 23.719, + "args": { + "External id": 445274,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007842544.079, "dur": 1.787, + "args": { + "External id": 445275,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842548.242, "dur": 2.928, + "args": { + "External id": 445276,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007842567.105, "dur": 13.247, + "args": { + "External id": 445277,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007842581.584, "dur": 11.012, + "args": { + "External id": 445278,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007842600.202, "dur": 2.095, + "args": { + "External id": 445279,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842611.144, "dur": 3.939, + "args": { + "External id": 445280,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842613.822, "dur": 0.567, + "args": { + "External id": 445281,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842717.843, "dur": 49.471, + "args": { + "External id": 445282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842772.778, "dur": 6.261, + "args": { + "External id": 445283,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842776.329, "dur": 1.355, + "args": { + "External id": 445284,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007842780.290, "dur": 26.235, + "args": { + "External id": 445285,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007842811.451, "dur": 6.621, + "args": { + "External id": 445286,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007842812.991, "dur": 4.420, + "args": { + "External id": 445287,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842815.383, "dur": 1.802, + "args": { + "External id": 445288,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007842820.917, "dur": 42.350, + "args": { + "External id": 445289,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842822.424, "dur": 40.148, + "args": { + "External id": 445290,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007842866.555, "dur": 15.043, + "args": { + "External id": 445291,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842886.921, "dur": 4.089, + "args": { + "External id": 445292,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842889.458, "dur": 0.706, + "args": { + "External id": 445293,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007842894.794, "dur": 50.120, + "args": { + "External id": 445294,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007842895.827, "dur": 5.091, + "args": { + "External id": 445295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007842897.472, "dur": 2.894, + "args": { + "External id": 445296,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842899.591, "dur": 0.654, + "args": { + "External id": 445297,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007842901.993, "dur": 42.516, + "args": { + "External id": 445298,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007842902.965, "dur": 41.061, + "args": { + "External id": 445299,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007842948.907, "dur": 3.931, + "args": { + "External id": 445300,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007842950.753, "dur": 0.991, + "args": { + "External id": 445301,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007842958.842, "dur": 1.704, + "args": { + "External id": 445302,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842968.311, "dur": 6.324, + "args": { + "External id": 445303,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007842970.400, "dur": 3.934, + "args": { + "External id": 445304,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007843054.168, "dur": 199.989, + "args": { + "External id": 445305,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843058.712, "dur": 2.329, + "args": { + "External id": 445306,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007843063.027, "dur": 190.529, + "args": { + "External id": 445307,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007843064.468, "dur": 0.403, + "args": { + "External id": 445308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007843066.336, "dur": 37.408, + "args": { + "External id": 445309,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007843106.203, "dur": 5.914, + "args": { + "External id": 445310,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843110.277, "dur": 1.397, + "args": { + "External id": 445311,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007843113.105, "dur": 23.916, + "args": { + "External id": 445312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843114.505, "dur": 2.076, + "args": { + "External id": 445313,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007843118.353, "dur": 18.356, + "args": { + "External id": 445314,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007843121.694, "dur": 2.689, + "args": { + "External id": 445315,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007843138.587, "dur": 18.753, + "args": { + "External id": 445316,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007843158.782, "dur": 16.158, + "args": { + "External id": 445317,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007843177.640, "dur": 14.424, + "args": { + "External id": 445318,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007843193.502, "dur": 13.033, + "args": { + "External id": 445319,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007843208.942, "dur": 19.491, + "args": { + "External id": 445320,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007843210.915, "dur": 1.756, + "args": { + "External id": 445321,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843215.111, "dur": 0.955, + "args": { + "External id": 445322,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007843230.111, "dur": 10.928, + "args": { + "External id": 445323,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007843242.118, "dur": 10.424, + "args": { + "External id": 445324,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007843261.271, "dur": 2.044, + "args": { + "External id": 445325,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007843272.413, "dur": 3.848, + "args": { + "External id": 445326,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843275.088, "dur": 0.416, + "args": { + "External id": 445327,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007843338.701, "dur": 41.404, + "args": { + "External id": 445328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007843384.304, "dur": 5.051, + "args": { + "External id": 445329,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843387.409, "dur": 0.934, + "args": { + "External id": 445330,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007843390.782, "dur": 21.297, + "args": { + "External id": 445331,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007843416.249, "dur": 6.722, + "args": { + "External id": 445332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007843418.127, "dur": 4.221, + "args": { + "External id": 445333,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843420.745, "dur": 1.417, + "args": { + "External id": 445334,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007843425.544, "dur": 40.302, + "args": { + "External id": 445335,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007843426.962, "dur": 38.329, + "args": { + "External id": 445336,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007843469.356, "dur": 13.010, + "args": { + "External id": 445337,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007843487.581, "dur": 3.580, + "args": { + "External id": 445338,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843489.706, "dur": 0.618, + "args": { + "External id": 445339,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007843494.759, "dur": 46.041, + "args": { + "External id": 445340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007843495.801, "dur": 4.544, + "args": { + "External id": 445341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007843496.970, "dur": 2.849, + "args": { + "External id": 445342,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843498.836, "dur": 0.833, + "args": { + "External id": 445343,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007843500.864, "dur": 39.538, + "args": { + "External id": 445344,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007843501.553, "dur": 38.340, + "args": { + "External id": 445345,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007843544.580, "dur": 3.550, + "args": { + "External id": 445346,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843546.328, "dur": 0.615, + "args": { + "External id": 445347,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007843554.006, "dur": 1.375, + "args": { + "External id": 445348,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843562.221, "dur": 8.033, + "args": { + "External id": 445349,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843564.150, "dur": 5.761, + "args": { + "External id": 445350,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007843641.272, "dur": 221.932, + "args": { + "External id": 445351,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843643.657, "dur": 2.737, + "args": { + "External id": 445352,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7575 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007843647.806, "dur": 214.962, + "args": { + "External id": 445353,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007843649.761, "dur": 0.308, + "args": { + "External id": 445354,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7577 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007843688.494, "dur": 28.471, + "args": { + "External id": 445355,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007843718.816, "dur": 4.297, + "args": { + "External id": 445356,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843721.295, "dur": 1.563, + "args": { + "External id": 445357,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007843724.321, "dur": 29.630, + "args": { + "External id": 445358,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007843725.454, "dur": 1.973, + "args": { + "External id": 445359,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007843728.985, "dur": 24.482, + "args": { + "External id": 445360,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007843734.213, "dur": 2.902, + "args": { + "External id": 445361,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007843755.470, "dur": 19.561, + "args": { + "External id": 445362,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007843776.129, "dur": 11.797, + "args": { + "External id": 445363,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007843791.013, "dur": 12.834, + "args": { + "External id": 445364,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007843805.066, "dur": 11.472, + "args": { + "External id": 445365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007843818.538, "dur": 18.840, + "args": { + "External id": 445366,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007843820.911, "dur": 1.720, + "args": { + "External id": 445367,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843824.872, "dur": 0.774, + "args": { + "External id": 445368,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007843838.960, "dur": 11.295, + "args": { + "External id": 445369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007843851.205, "dur": 10.677, + "args": { + "External id": 445370,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007843870.183, "dur": 2.207, + "args": { + "External id": 445371,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007843881.429, "dur": 3.763, + "args": { + "External id": 445372,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007843883.965, "dur": 0.411, + "args": { + "External id": 445373,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007843967.964, "dur": 45.457, + "args": { + "External id": 445374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844018.335, "dur": 7.902, + "args": { + "External id": 445375,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844021.524, "dur": 3.610, + "args": { + "External id": 445376,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007844028.125, "dur": 22.328, + "args": { + "External id": 445377,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007844054.696, "dur": 6.123, + "args": { + "External id": 445378,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007844056.436, "dur": 3.786, + "args": { + "External id": 445379,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844058.965, "dur": 1.064, + "args": { + "External id": 445380,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007844063.170, "dur": 80.233, + "args": { + "External id": 445381,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007844064.530, "dur": 77.650, + "args": { + "External id": 445382,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007844148.400, "dur": 18.220, + "args": { + "External id": 445383,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844172.306, "dur": 4.484, + "args": { + "External id": 445384,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844175.034, "dur": 0.844, + "args": { + "External id": 445385,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007844180.808, "dur": 51.614, + "args": { + "External id": 445386,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007844182.032, "dur": 5.376, + "args": { + "External id": 445387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007844183.039, "dur": 3.758, + "args": { + "External id": 445388,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844185.552, "dur": 1.105, + "args": { + "External id": 445389,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007844188.002, "dur": 44.076, + "args": { + "External id": 445390,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007844189.079, "dur": 42.484, + "args": { + "External id": 445391,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844236.552, "dur": 3.843, + "args": { + "External id": 445392,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844238.686, "dur": 0.689, + "args": { + "External id": 445393,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007844246.165, "dur": 1.938, + "args": { + "External id": 445394,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844256.776, "dur": 13.412, + "args": { + "External id": 445395,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844264.021, "dur": 5.810, + "args": { + "External id": 445396,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007844352.624, "dur": 180.298, + "args": { + "External id": 445397,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844354.702, "dur": 2.380, + "args": { + "External id": 445398,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007844358.675, "dur": 173.737, + "args": { + "External id": 445399,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007844360.497, "dur": 0.318, + "args": { + "External id": 445400,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007844362.387, "dur": 23.713, + "args": { + "External id": 445401,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007844387.593, "dur": 3.490, + "args": { + "External id": 445402,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844389.507, "dur": 1.179, + "args": { + "External id": 445403,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007844392.473, "dur": 25.477, + "args": { + "External id": 445404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844393.919, "dur": 1.740, + "args": { + "External id": 445405,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007844397.086, "dur": 20.572, + "args": { + "External id": 445406,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007844402.385, "dur": 2.624, + "args": { + "External id": 445407,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007844419.759, "dur": 19.870, + "args": { + "External id": 445408,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007844441.097, "dur": 12.459, + "args": { + "External id": 445409,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007844456.364, "dur": 12.584, + "args": { + "External id": 445410,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007844470.433, "dur": 12.886, + "args": { + "External id": 445411,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007844485.273, "dur": 19.692, + "args": { + "External id": 445412,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007844487.128, "dur": 1.521, + "args": { + "External id": 445413,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844490.801, "dur": 0.643, + "args": { + "External id": 445414,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007844506.788, "dur": 12.746, + "args": { + "External id": 445415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007844520.790, "dur": 10.679, + "args": { + "External id": 445416,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007844538.977, "dur": 1.514, + "args": { + "External id": 445417,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844549.545, "dur": 3.582, + "args": { + "External id": 445418,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844551.904, "dur": 0.446, + "args": { + "External id": 445419,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007844614.620, "dur": 82.064, + "args": { + "External id": 445420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844703.507, "dur": 6.564, + "args": { + "External id": 445421,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844707.244, "dur": 1.258, + "args": { + "External id": 445422,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007844711.641, "dur": 26.514, + "args": { + "External id": 445423,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007844743.300, "dur": 6.784, + "args": { + "External id": 445424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007844745.415, "dur": 3.956, + "args": { + "External id": 445425,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844747.675, "dur": 1.425, + "args": { + "External id": 445426,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007844753.119, "dur": 49.643, + "args": { + "External id": 445427,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007844755.043, "dur": 46.896, + "args": { + "External id": 445428,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007844806.498, "dur": 16.125, + "args": { + "External id": 445429,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844828.375, "dur": 3.667, + "args": { + "External id": 445430,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844830.677, "dur": 0.572, + "args": { + "External id": 445431,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007844836.201, "dur": 50.804, + "args": { + "External id": 445432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007844837.294, "dur": 4.639, + "args": { + "External id": 445433,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007844838.561, "dur": 2.773, + "args": { + "External id": 445434,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844840.485, "dur": 0.728, + "args": { + "External id": 445435,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007844842.923, "dur": 43.712, + "args": { + "External id": 445436,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007844844.328, "dur": 41.802, + "args": { + "External id": 445437,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007844890.899, "dur": 5.879, + "args": { + "External id": 445438,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007844893.188, "dur": 2.562, + "args": { + "External id": 445439,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007844902.955, "dur": 1.881, + "args": { + "External id": 445440,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844934.120, "dur": 7.606, + "args": { + "External id": 445441,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007844936.721, "dur": 4.708, + "args": { + "External id": 445442,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007845026.779, "dur": 211.160, + "args": { + "External id": 445443,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007845028.886, "dur": 2.283, + "args": { + "External id": 445444,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007845034.790, "dur": 202.740, + "args": { + "External id": 445445,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007845036.281, "dur": 0.388, + "args": { + "External id": 445446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007845037.712, "dur": 22.136, + "args": { + "External id": 445447,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007845061.310, "dur": 4.712, + "args": { + "External id": 445448,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845063.219, "dur": 2.504, + "args": { + "External id": 445449,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007845066.967, "dur": 40.155, + "args": { + "External id": 445450,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007845067.960, "dur": 1.316, + "args": { + "External id": 445451,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007845070.917, "dur": 35.545, + "args": { + "External id": 445452,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007845073.499, "dur": 2.513, + "args": { + "External id": 445453,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007845109.333, "dur": 23.684, + "args": { + "External id": 445454,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007845134.468, "dur": 13.535, + "args": { + "External id": 445455,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007845151.546, "dur": 16.007, + "args": { + "External id": 445456,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007845168.845, "dur": 13.556, + "args": { + "External id": 445457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007845184.634, "dur": 24.019, + "args": { + "External id": 445458,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007845186.775, "dur": 1.649, + "args": { + "External id": 445459,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845190.771, "dur": 2.597, + "args": { + "External id": 445460,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007845210.389, "dur": 12.891, + "args": { + "External id": 445461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007845224.460, "dur": 11.626, + "args": { + "External id": 445462,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007845245.285, "dur": 2.612, + "args": { + "External id": 445463,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845256.701, "dur": 3.275, + "args": { + "External id": 445464,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845258.850, "dur": 0.383, + "args": { + "External id": 445465,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007845323.686, "dur": 47.023, + "args": { + "External id": 445466,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845375.028, "dur": 5.309, + "args": { + "External id": 445467,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845378.272, "dur": 0.965, + "args": { + "External id": 445468,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007845381.788, "dur": 23.374, + "args": { + "External id": 445469,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007845409.413, "dur": 6.047, + "args": { + "External id": 445470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007845411.067, "dur": 3.581, + "args": { + "External id": 445471,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845412.937, "dur": 1.519, + "args": { + "External id": 445472,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007845418.023, "dur": 42.161, + "args": { + "External id": 445473,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007845419.451, "dur": 40.094, + "args": { + "External id": 445474,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007845463.704, "dur": 16.012, + "args": { + "External id": 445475,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007845484.450, "dur": 24.095, + "args": { + "External id": 445476,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007845486.690, "dur": 21.499, + "args": { + "External id": 445477,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845491.997, "dur": 0.990, + "args": { + "External id": 445478,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007845513.809, "dur": 31.993, + "args": { + "External id": 445479,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007845520.019, "dur": 25.496, + "args": { + "External id": 445480,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 7703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845524.857, "dur": 4.275, + "args": { + "External id": 445481,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007845530.201, "dur": 14.798, + "args": { + "External id": 445482,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007845559.839, "dur": 4.927, + "args": { + "External id": 445483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007845561.953, "dur": 2.572, + "args": { + "External id": 445484,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007845565.863, "dur": 1.216, + "args": { + "External id": 445485,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007845566.552, "dur": 0.455, + "args": { + "External id": 445486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007845607.013, "dur": 22.136, + "args": { + "External id": 445487,"Sequence number": 5285584, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007845631.299, "dur": 14.262, + "args": { + "External id": 445488,"Sequence number": 5285585, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 7711 + } + }, + { + "ph": "s", "id": 16, "pid": 4183441, "tid": 4183441, "ts": 676007845631.299, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845651.308, "dur": 46.812, + "args": { + "External id": 445489,"Sequence number": 5285586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 7712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845694.118, "dur": 1.500, + "args": { + "External id": 445490,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007845701.008, "dur": 7.058, + "args": { + "External id": 445491,"Sequence number": 5285586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 7714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845706.058, "dur": 0.875, + "args": { + "External id": 445492,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 7715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845709.731, "dur": 3.670, + "args": { + "External id": 445493,"Sequence number": 5285586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 7716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845712.022, "dur": 0.806, + "args": { + "External id": 445494,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 7717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845718.550, "dur": 6.433, + "args": { + "External id": 445495,"Sequence number": 5285586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7718 + } + }, + { + "ph": "s", "id": 15, "pid": 4183441, "tid": 4183441, "ts": 676007845718.550, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845722.223, "dur": 1.127, + "args": { + "External id": 445496,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845725.936, "dur": 5.574, + "args": { + "External id": 445497,"Sequence number": 5285587, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 7720 + } + }, + { + "ph": "s", "id": 14, "pid": 4183441, "tid": 4183441, "ts": 676007845725.936, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845730.076, "dur": 0.642, + "args": { + "External id": 445498,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007845732.412, "dur": 5.464, + "args": { + "External id": 445499,"Sequence number": 5285588, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 7722 + } + }, + { + "ph": "s", "id": 13, "pid": 4183441, "tid": 4183441, "ts": 676007845732.412, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845735.856, "dur": 1.033, + "args": { + "External id": 445500,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 7723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007845739.018, "dur": 4.730, + "args": { + "External id": 445501,"Sequence number": 5285589, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 7724 + } + }, + { + "ph": "s", "id": 12, "pid": 4183441, "tid": 4183441, "ts": 676007845739.018, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845742.002, "dur": 0.956, + "args": { + "External id": 445502,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 7725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007845747.612, "dur": 37.201, + "args": { + "External id": 445503,"Sequence number": 5285590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007845749.205, "dur": 35.392, + "args": { + "External id": 445504,"Sequence number": 5285590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845752.036, "dur": 7.498, + "args": { + "External id": 445505,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 7728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007845754.738, "dur": 4.207, + "args": { + "External id": 445506,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007845760.713, "dur": 23.377, + "args": { + "External id": 445507,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 7730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007845812.949, "dur": 6.248, + "args": { + "External id": 445508,"Sequence number": 5285590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 7731 + } + }, + { + "ph": "s", "id": 11, "pid": 4183441, "tid": 4183441, "ts": 676007845812.949, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007845821.422, "dur": 1.401, + "args": { + "External id": 445509,"Sequence number": 5285591, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 7732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007845855.342, "dur": 23311.142, + "args": { + "External id": 445510,"Sequence number": 5285591, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 7733 + } + }, + { + "ph": "s", "id": 10, "pid": 4183441, "tid": 4183441, "ts": 676007845855.342, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007845869.927, "dur": 28.699, + "args": { + "External id": 445511,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007845870.763, "dur": 27.640, + "args": { + "External id": 445512,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845872.255, "dur": 6.093, + "args": { + "External id": 445513,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007845874.000, "dur": 3.888, + "args": { + "External id": 445514,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007845879.248, "dur": 18.659, + "args": { + "External id": 445515,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 7738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845913.396, "dur": 26.186, + "args": { + "External id": 445516,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845914.713, "dur": 6.981, + "args": { + "External id": 445517,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 7740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845917.252, "dur": 4.117, + "args": { + "External id": 445518,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007845922.907, "dur": 16.404, + "args": { + "External id": 445519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 7742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007845924.639, "dur": 14.270, + "args": { + "External id": 445520,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 7743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845942.547, "dur": 20.431, + "args": { + "External id": 445521,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007845943.917, "dur": 4.709, + "args": { + "External id": 445522,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 7745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007845945.404, "dur": 3.009, + "args": { + "External id": 445523,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007845949.135, "dur": 13.647, + "args": { + "External id": 445524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007845949.995, "dur": 12.360, + "args": { + "External id": 445525,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 7748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007845968.928, "dur": 19.124, + "args": { + "External id": 445526,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 7749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007845972.996, "dur": 2.514, + "args": { + "External id": 445527,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007845976.116, "dur": 11.668, + "args": { + "External id": 445528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 7751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007845976.850, "dur": 10.630, + "args": { + "External id": 445529,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 4183441, + "ts": 676007845993.126, "dur": 23.313, + "args": { + "External id": 445530,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007846019.406, "dur": 51.720, + "args": { + "External id": 445531,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 7754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007846021.480, "dur": 49.177, + "args": { + "External id": 445532,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007846026.565, "dur": 1.414, + "args": { + "External id": 445533,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 7756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007846029.330, "dur": 24.219, + "args": { + "External id": 445534,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007846031.580, "dur": 21.761, + "args": { + "External id": 445535,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 7758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007846036.478, "dur": 2.837, + "args": { + "External id": 445536,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007846040.007, "dur": 12.983, + "args": { + "External id": 445537,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 7760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676007846075.214, "dur": 17623.497, + "args": { + "External id": 445538,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676007846076.750, "dur": 17621.113, + "args": { + "External id": 445539,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 7762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007863708.427, "dur": 9.468, + "args": { + "External id": 445540,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007863715.346, "dur": 1.050, + "args": { + "External id": 445541,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007863722.899, "dur": 99.109, + "args": { + "External id": 445542,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007863724.559, "dur": 6.751, + "args": { + "External id": 445543,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007863727.046, "dur": 3.273, + "args": { + "External id": 445544,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007863729.116, "dur": 0.887, + "args": { + "External id": 445545,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007863732.702, "dur": 88.607, + "args": { + "External id": 445546,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007863734.502, "dur": 86.077, + "args": { + "External id": 445547,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007863825.209, "dur": 4.054, + "args": { + "External id": 445548,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007863827.118, "dur": 0.958, + "args": { + "External id": 445549,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007863836.043, "dur": 1.994, + "args": { + "External id": 445550,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007863846.989, "dur": 6.493, + "args": { + "External id": 445551,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007863849.390, "dur": 3.815, + "args": { + "External id": 445552,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007863970.047, "dur": 220.620, + "args": { + "External id": 445553,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007863972.741, "dur": 2.525, + "args": { + "External id": 445554,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007863979.221, "dur": 210.915, + "args": { + "External id": 445555,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007863981.348, "dur": 0.544, + "args": { + "External id": 445556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007863983.868, "dur": 25.399, + "args": { + "External id": 445557,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007864011.039, "dur": 5.005, + "args": { + "External id": 445558,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864013.299, "dur": 2.467, + "args": { + "External id": 445559,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007864017.283, "dur": 24.896, + "args": { + "External id": 445560,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007864018.583, "dur": 1.456, + "args": { + "External id": 445561,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007864021.438, "dur": 20.497, + "args": { + "External id": 445562,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007864024.760, "dur": 3.457, + "args": { + "External id": 445563,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007864044.165, "dur": 23.099, + "args": { + "External id": 445564,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007864068.702, "dur": 27.530, + "args": { + "External id": 445565,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007864100.475, "dur": 19.273, + "args": { + "External id": 445566,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007864121.313, "dur": 13.419, + "args": { + "External id": 445567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007864136.910, "dur": 22.814, + "args": { + "External id": 445568,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007864139.404, "dur": 1.844, + "args": { + "External id": 445569,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864143.558, "dur": 0.927, + "args": { + "External id": 445570,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007864161.728, "dur": 12.946, + "args": { + "External id": 445571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007864176.244, "dur": 12.884, + "args": { + "External id": 445572,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007864197.996, "dur": 2.381, + "args": { + "External id": 445573,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007864207.095, "dur": 3.905, + "args": { + "External id": 445574,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864209.316, "dur": 0.826, + "args": { + "External id": 445575,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007864279.557, "dur": 57.158, + "args": { + "External id": 445576,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007864341.841, "dur": 8.585, + "args": { + "External id": 445577,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864344.953, "dur": 2.720, + "args": { + "External id": 445578,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007864352.240, "dur": 25.770, + "args": { + "External id": 445579,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007864383.212, "dur": 6.732, + "args": { + "External id": 445580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007864385.131, "dur": 4.021, + "args": { + "External id": 445581,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864387.645, "dur": 1.055, + "args": { + "External id": 445582,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007864393.111, "dur": 45.271, + "args": { + "External id": 445583,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007864394.623, "dur": 43.063, + "args": { + "External id": 445584,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007864442.542, "dur": 15.921, + "args": { + "External id": 445585,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007864464.654, "dur": 3.773, + "args": { + "External id": 445586,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864466.991, "dur": 0.636, + "args": { + "External id": 445587,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007864472.900, "dur": 49.216, + "args": { + "External id": 445588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007864474.093, "dur": 4.119, + "args": { + "External id": 445589,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007864474.893, "dur": 2.732, + "args": { + "External id": 445590,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864476.867, "dur": 0.626, + "args": { + "External id": 445591,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007864479.005, "dur": 42.796, + "args": { + "External id": 445592,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007864479.644, "dur": 41.559, + "args": { + "External id": 445593,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007864525.935, "dur": 4.309, + "args": { + "External id": 445594,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864527.950, "dur": 1.061, + "args": { + "External id": 445595,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007864535.911, "dur": 1.524, + "args": { + "External id": 445596,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007864544.917, "dur": 6.426, + "args": { + "External id": 445597,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007864547.076, "dur": 4.016, + "args": { + "External id": 445598,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007864639.431, "dur": 254.186, + "args": { + "External id": 445599,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007864641.578, "dur": 4.300, + "args": { + "External id": 445600,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007864647.483, "dur": 245.760, + "args": { + "External id": 445601,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007864649.403, "dur": 0.522, + "args": { + "External id": 445602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007864651.230, "dur": 64.344, + "args": { + "External id": 445603,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007864718.412, "dur": 6.551, + "args": { + "External id": 445604,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864723.369, "dur": 1.292, + "args": { + "External id": 445605,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007864726.014, "dur": 34.820, + "args": { + "External id": 445606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007864727.466, "dur": 1.871, + "args": { + "External id": 445607,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007864741.471, "dur": 19.108, + "args": { + "External id": 445608,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007864744.683, "dur": 2.818, + "args": { + "External id": 445609,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007864762.603, "dur": 22.039, + "args": { + "External id": 445610,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007864786.049, "dur": 17.877, + "args": { + "External id": 445611,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007864806.741, "dur": 15.599, + "args": { + "External id": 445612,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007864823.919, "dur": 14.015, + "args": { + "External id": 445613,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007864839.755, "dur": 21.536, + "args": { + "External id": 445614,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007864841.781, "dur": 1.357, + "args": { + "External id": 445615,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864845.725, "dur": 0.710, + "args": { + "External id": 445616,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007864863.100, "dur": 13.690, + "args": { + "External id": 445617,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007864877.986, "dur": 14.085, + "args": { + "External id": 445618,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007864901.422, "dur": 2.660, + "args": { + "External id": 445619,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007864913.450, "dur": 3.856, + "args": { + "External id": 445620,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007864916.077, "dur": 0.417, + "args": { + "External id": 445621,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007864994.337, "dur": 49.118, + "args": { + "External id": 445622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865048.034, "dur": 5.379, + "args": { + "External id": 445623,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865051.183, "dur": 0.997, + "args": { + "External id": 445624,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007865054.647, "dur": 43.283, + "args": { + "External id": 445625,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007865104.653, "dur": 7.337, + "args": { + "External id": 445626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007865106.789, "dur": 4.364, + "args": { + "External id": 445627,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865109.356, "dur": 1.587, + "args": { + "External id": 445628,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007865115.283, "dur": 52.029, + "args": { + "External id": 445629,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007865116.590, "dur": 50.240, + "args": { + "External id": 445630,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007865171.006, "dur": 17.026, + "args": { + "External id": 445631,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865194.158, "dur": 4.600, + "args": { + "External id": 445632,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865196.992, "dur": 0.698, + "args": { + "External id": 445633,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007865203.139, "dur": 47.806, + "args": { + "External id": 445634,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007865203.970, "dur": 4.845, + "args": { + "External id": 445635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007865205.148, "dur": 3.029, + "args": { + "External id": 445636,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865207.086, "dur": 0.959, + "args": { + "External id": 445637,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007865209.355, "dur": 41.180, + "args": { + "External id": 445638,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007865210.221, "dur": 39.744, + "args": { + "External id": 445639,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865255.231, "dur": 3.837, + "args": { + "External id": 445640,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865256.774, "dur": 1.149, + "args": { + "External id": 445641,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007865264.795, "dur": 1.645, + "args": { + "External id": 445642,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865274.810, "dur": 8.218, + "args": { + "External id": 445643,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865277.185, "dur": 5.563, + "args": { + "External id": 445644,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007865369.621, "dur": 187.317, + "args": { + "External id": 445645,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865372.219, "dur": 2.331, + "args": { + "External id": 445646,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007865375.898, "dur": 180.546, + "args": { + "External id": 445647,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007865377.711, "dur": 0.409, + "args": { + "External id": 445648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007865379.519, "dur": 24.442, + "args": { + "External id": 445649,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007865405.818, "dur": 3.605, + "args": { + "External id": 445650,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865408.284, "dur": 0.858, + "args": { + "External id": 445651,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007865410.422, "dur": 23.996, + "args": { + "External id": 445652,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865411.514, "dur": 1.880, + "args": { + "External id": 445653,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007865414.528, "dur": 19.603, + "args": { + "External id": 445654,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007865419.210, "dur": 2.097, + "args": { + "External id": 445655,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007865435.931, "dur": 21.194, + "args": { + "External id": 445656,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007865458.936, "dur": 14.375, + "args": { + "External id": 445657,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007865476.136, "dur": 15.208, + "args": { + "External id": 445658,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007865492.630, "dur": 13.028, + "args": { + "External id": 445659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007865507.530, "dur": 20.229, + "args": { + "External id": 445660,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007865509.504, "dur": 1.468, + "args": { + "External id": 445661,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865512.908, "dur": 1.149, + "args": { + "External id": 445662,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007865529.693, "dur": 12.862, + "args": { + "External id": 445663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007865543.591, "dur": 11.954, + "args": { + "External id": 445664,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007865563.200, "dur": 1.597, + "args": { + "External id": 445665,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865573.607, "dur": 2.959, + "args": { + "External id": 445666,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865575.245, "dur": 0.564, + "args": { + "External id": 445667,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007865635.848, "dur": 83.753, + "args": { + "External id": 445668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865726.594, "dur": 6.541, + "args": { + "External id": 445669,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865730.282, "dur": 1.478, + "args": { + "External id": 445670,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007865734.584, "dur": 24.791, + "args": { + "External id": 445671,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007865764.707, "dur": 5.570, + "args": { + "External id": 445672,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007865766.530, "dur": 3.055, + "args": { + "External id": 445673,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865768.528, "dur": 0.874, + "args": { + "External id": 445674,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007865772.964, "dur": 42.147, + "args": { + "External id": 445675,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007865774.617, "dur": 39.876, + "args": { + "External id": 445676,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007865818.700, "dur": 15.673, + "args": { + "External id": 445677,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865840.142, "dur": 3.999, + "args": { + "External id": 445678,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865842.429, "dur": 0.878, + "args": { + "External id": 445679,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007865848.038, "dur": 52.776, + "args": { + "External id": 445680,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007865849.116, "dur": 5.865, + "args": { + "External id": 445681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007865850.167, "dur": 4.246, + "args": { + "External id": 445682,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865851.907, "dur": 2.327, + "args": { + "External id": 445683,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007865855.665, "dur": 44.819, + "args": { + "External id": 445684,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007865856.593, "dur": 43.280, + "args": { + "External id": 445685,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007865904.382, "dur": 3.815, + "args": { + "External id": 445686,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007865906.400, "dur": 0.644, + "args": { + "External id": 445687,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007865914.023, "dur": 1.537, + "args": { + "External id": 445688,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865922.567, "dur": 7.103, + "args": { + "External id": 445689,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007865925.015, "dur": 4.394, + "args": { + "External id": 445690,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007866011.186, "dur": 206.247, + "args": { + "External id": 445691,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866013.796, "dur": 2.138, + "args": { + "External id": 445692,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007866017.551, "dur": 199.499, + "args": { + "External id": 445693,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007866018.969, "dur": 0.589, + "args": { + "External id": 445694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007866023.119, "dur": 20.967, + "args": { + "External id": 445695,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007866045.703, "dur": 3.167, + "args": { + "External id": 445696,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866047.785, "dur": 0.837, + "args": { + "External id": 445697,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007866050.003, "dur": 24.627, + "args": { + "External id": 445698,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866051.349, "dur": 3.540, + "args": { + "External id": 445699,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007866056.263, "dur": 17.987, + "args": { + "External id": 445700,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007866058.837, "dur": 2.940, + "args": { + "External id": 445701,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007866076.233, "dur": 38.434, + "args": { + "External id": 445702,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007866116.826, "dur": 14.733, + "args": { + "External id": 445703,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007866134.515, "dur": 14.620, + "args": { + "External id": 445704,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007866150.542, "dur": 13.382, + "args": { + "External id": 445705,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007866166.236, "dur": 22.787, + "args": { + "External id": 445706,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007866168.502, "dur": 2.177, + "args": { + "External id": 445707,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866173.111, "dur": 1.191, + "args": { + "External id": 445708,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007866190.990, "dur": 12.837, + "args": { + "External id": 445709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007866204.967, "dur": 10.907, + "args": { + "External id": 445710,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007866224.607, "dur": 2.123, + "args": { + "External id": 445711,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866235.228, "dur": 3.544, + "args": { + "External id": 445712,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866237.530, "dur": 0.528, + "args": { + "External id": 445713,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007866302.913, "dur": 44.249, + "args": { + "External id": 445714,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866351.198, "dur": 5.356, + "args": { + "External id": 445715,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866354.302, "dur": 1.213, + "args": { + "External id": 445716,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007866357.697, "dur": 21.245, + "args": { + "External id": 445717,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007866382.929, "dur": 7.717, + "args": { + "External id": 445718,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007866384.828, "dur": 5.245, + "args": { + "External id": 445719,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866387.082, "dur": 2.794, + "args": { + "External id": 445720,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007866392.868, "dur": 40.204, + "args": { + "External id": 445721,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007866394.191, "dur": 38.262, + "args": { + "External id": 445722,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007866436.429, "dur": 15.611, + "args": { + "External id": 445723,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866457.288, "dur": 4.465, + "args": { + "External id": 445724,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866459.749, "dur": 1.161, + "args": { + "External id": 445725,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007866465.270, "dur": 60.420, + "args": { + "External id": 445726,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007866466.267, "dur": 4.314, + "args": { + "External id": 445727,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007866467.077, "dur": 2.990, + "args": { + "External id": 445728,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866468.920, "dur": 1.020, + "args": { + "External id": 445729,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007866485.177, "dur": 40.192, + "args": { + "External id": 445730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007866486.233, "dur": 38.608, + "args": { + "External id": 445731,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866529.882, "dur": 3.652, + "args": { + "External id": 445732,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866531.619, "dur": 0.833, + "args": { + "External id": 445733,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007866538.894, "dur": 1.442, + "args": { + "External id": 445734,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 7957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866547.282, "dur": 7.648, + "args": { + "External id": 445735,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 7958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866549.244, "dur": 5.406, + "args": { + "External id": 445736,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007866627.876, "dur": 231.716, + "args": { + "External id": 445737,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866630.123, "dur": 2.266, + "args": { + "External id": 445738,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007866633.576, "dur": 225.389, + "args": { + "External id": 445739,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 7962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007866635.371, "dur": 0.285, + "args": { + "External id": 445740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007866637.035, "dur": 60.600, + "args": { + "External id": 445741,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 7964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007866700.526, "dur": 4.060, + "args": { + "External id": 445742,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 7965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866702.897, "dur": 1.339, + "args": { + "External id": 445743,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 7966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007866705.484, "dur": 29.774, + "args": { + "External id": 445744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007866707.084, "dur": 2.201, + "args": { + "External id": 445745,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007866710.698, "dur": 24.290, + "args": { + "External id": 445746,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 7969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007866716.038, "dur": 2.770, + "args": { + "External id": 445747,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007866736.743, "dur": 21.787, + "args": { + "External id": 445748,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007866759.785, "dur": 13.643, + "args": { + "External id": 445749,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007866775.897, "dur": 15.119, + "args": { + "External id": 445750,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 7973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007866792.327, "dur": 12.705, + "args": { + "External id": 445751,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 7974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007866806.891, "dur": 22.463, + "args": { + "External id": 445752,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 7975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007866809.116, "dur": 1.554, + "args": { + "External id": 445753,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 7976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866812.870, "dur": 0.904, + "args": { + "External id": 445754,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 7977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007866830.889, "dur": 14.055, + "args": { + "External id": 445755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 7978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007866846.113, "dur": 11.788, + "args": { + "External id": 445756,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 7979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007866866.950, "dur": 2.026, + "args": { + "External id": 445757,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 7980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866878.093, "dur": 3.850, + "args": { + "External id": 445758,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 7981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866880.711, "dur": 0.384, + "args": { + "External id": 445759,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 7982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007866943.886, "dur": 46.343, + "args": { + "External id": 445760,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 7983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007866995.129, "dur": 4.562, + "args": { + "External id": 445761,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007866997.853, "dur": 0.879, + "args": { + "External id": 445762,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007867000.806, "dur": 23.037, + "args": { + "External id": 445763,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 7986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007867028.114, "dur": 6.127, + "args": { + "External id": 445764,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 7987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007867029.669, "dur": 3.915, + "args": { + "External id": 445765,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 7988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867031.986, "dur": 1.388, + "args": { + "External id": 445766,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 7989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007867036.448, "dur": 38.954, + "args": { + "External id": 445767,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007867037.428, "dur": 37.417, + "args": { + "External id": 445768,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 7991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007867078.645, "dur": 35.220, + "args": { + "External id": 445769,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 7992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867121.874, "dur": 4.867, + "args": { + "External id": 445770,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 7993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867124.365, "dur": 1.257, + "args": { + "External id": 445771,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 7994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007867130.754, "dur": 52.884, + "args": { + "External id": 445772,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 7995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007867131.894, "dur": 4.820, + "args": { + "External id": 445773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 7996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007867132.962, "dur": 3.036, + "args": { + "External id": 445774,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 7997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867134.983, "dur": 0.864, + "args": { + "External id": 445775,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 7998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007867137.258, "dur": 46.020, + "args": { + "External id": 445776,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 7999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007867137.872, "dur": 44.888, + "args": { + "External id": 445777,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867187.629, "dur": 5.219, + "args": { + "External id": 445778,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867189.241, "dur": 2.516, + "args": { + "External id": 445779,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007867198.873, "dur": 1.443, + "args": { + "External id": 445780,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867208.258, "dur": 6.671, + "args": { + "External id": 445781,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867210.363, "dur": 4.281, + "args": { + "External id": 445782,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007867298.193, "dur": 182.127, + "args": { + "External id": 445783,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867300.415, "dur": 2.372, + "args": { + "External id": 445784,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007867304.458, "dur": 175.398, + "args": { + "External id": 445785,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007867305.928, "dur": 0.622, + "args": { + "External id": 445786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007867308.192, "dur": 23.253, + "args": { + "External id": 445787,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007867332.988, "dur": 3.743, + "args": { + "External id": 445788,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867335.408, "dur": 1.068, + "args": { + "External id": 445789,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007867337.668, "dur": 24.886, + "args": { + "External id": 445790,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867338.691, "dur": 1.671, + "args": { + "External id": 445791,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007867341.513, "dur": 20.741, + "args": { + "External id": 445792,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007867346.409, "dur": 2.550, + "args": { + "External id": 445793,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007867364.119, "dur": 20.368, + "args": { + "External id": 445794,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007867385.868, "dur": 14.024, + "args": { + "External id": 445795,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007867402.781, "dur": 15.097, + "args": { + "External id": 445796,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007867419.341, "dur": 13.304, + "args": { + "External id": 445797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007867434.470, "dur": 20.284, + "args": { + "External id": 445798,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007867437.024, "dur": 1.339, + "args": { + "External id": 445799,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867440.910, "dur": 1.015, + "args": { + "External id": 445800,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007867456.086, "dur": 11.324, + "args": { + "External id": 445801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007867468.455, "dur": 10.460, + "args": { + "External id": 445802,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007867485.921, "dur": 1.399, + "args": { + "External id": 445803,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867494.761, "dur": 3.265, + "args": { + "External id": 445804,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867496.905, "dur": 0.354, + "args": { + "External id": 445805,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007867558.584, "dur": 39.102, + "args": { + "External id": 445806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867602.059, "dur": 5.094, + "args": { + "External id": 445807,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867604.764, "dur": 1.358, + "args": { + "External id": 445808,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007867608.572, "dur": 24.347, + "args": { + "External id": 445809,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007867637.254, "dur": 6.071, + "args": { + "External id": 445810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007867638.884, "dur": 3.837, + "args": { + "External id": 445811,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867640.994, "dur": 1.499, + "args": { + "External id": 445812,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007867645.480, "dur": 82.121, + "args": { + "External id": 445813,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007867646.690, "dur": 79.922, + "args": { + "External id": 445814,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007867732.633, "dur": 15.299, + "args": { + "External id": 445815,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867754.311, "dur": 4.734, + "args": { + "External id": 445816,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867756.977, "dur": 1.000, + "args": { + "External id": 445817,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007867763.111, "dur": 49.611, + "args": { + "External id": 445818,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007867764.071, "dur": 6.846, + "args": { + "External id": 445819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007867765.089, "dur": 5.242, + "args": { + "External id": 445820,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867769.535, "dur": 0.625, + "args": { + "External id": 445821,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007867771.494, "dur": 40.881, + "args": { + "External id": 445822,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007867772.352, "dur": 39.577, + "args": { + "External id": 445823,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007867817.090, "dur": 4.244, + "args": { + "External id": 445824,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867819.143, "dur": 1.087, + "args": { + "External id": 445825,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007867827.288, "dur": 1.664, + "args": { + "External id": 445826,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867837.034, "dur": 5.629, + "args": { + "External id": 445827,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867838.584, "dur": 3.808, + "args": { + "External id": 445828,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007867926.157, "dur": 255.573, + "args": { + "External id": 445829,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867928.128, "dur": 2.355, + "args": { + "External id": 445830,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007867932.302, "dur": 249.039, + "args": { + "External id": 445831,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007867936.168, "dur": 0.397, + "args": { + "External id": 445832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007867937.926, "dur": 24.289, + "args": { + "External id": 445833,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007867964.237, "dur": 3.489, + "args": { + "External id": 445834,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007867966.197, "dur": 1.242, + "args": { + "External id": 445835,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007867968.825, "dur": 35.782, + "args": { + "External id": 445836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007867971.942, "dur": 1.464, + "args": { + "External id": 445837,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007867974.672, "dur": 29.671, + "args": { + "External id": 445838,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007867977.185, "dur": 2.320, + "args": { + "External id": 445839,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007868006.235, "dur": 40.612, + "args": { + "External id": 445840,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007868048.282, "dur": 30.035, + "args": { + "External id": 445841,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007868081.026, "dur": 31.996, + "args": { + "External id": 445842,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007868115.066, "dur": 16.965, + "args": { + "External id": 445843,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007868133.848, "dur": 20.814, + "args": { + "External id": 445844,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007868135.846, "dur": 1.998, + "args": { + "External id": 445845,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868140.396, "dur": 1.044, + "args": { + "External id": 445846,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007868156.149, "dur": 11.855, + "args": { + "External id": 445847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007868169.248, "dur": 10.946, + "args": { + "External id": 445848,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007868188.938, "dur": 2.042, + "args": { + "External id": 445849,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868199.430, "dur": 3.509, + "args": { + "External id": 445850,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868201.789, "dur": 0.404, + "args": { + "External id": 445851,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007868264.286, "dur": 45.054, + "args": { + "External id": 445852,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868327.503, "dur": 7.384, + "args": { + "External id": 445853,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868330.592, "dur": 3.158, + "args": { + "External id": 445854,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007868336.584, "dur": 23.814, + "args": { + "External id": 445855,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007868365.292, "dur": 5.683, + "args": { + "External id": 445856,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007868366.768, "dur": 3.560, + "args": { + "External id": 445857,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868368.934, "dur": 1.022, + "args": { + "External id": 445858,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007868373.747, "dur": 40.648, + "args": { + "External id": 445859,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007868375.091, "dur": 38.730, + "args": { + "External id": 445860,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007868417.818, "dur": 14.978, + "args": { + "External id": 445861,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868438.181, "dur": 3.498, + "args": { + "External id": 445862,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868440.279, "dur": 0.528, + "args": { + "External id": 445863,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007868445.251, "dur": 46.312, + "args": { + "External id": 445864,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007868446.364, "dur": 4.222, + "args": { + "External id": 445865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007868447.309, "dur": 2.749, + "args": { + "External id": 445866,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868449.005, "dur": 0.923, + "args": { + "External id": 445867,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007868451.170, "dur": 40.008, + "args": { + "External id": 445868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007868451.725, "dur": 38.978, + "args": { + "External id": 445869,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868495.313, "dur": 3.381, + "args": { + "External id": 445870,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868497.070, "dur": 0.550, + "args": { + "External id": 445871,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007868503.573, "dur": 1.473, + "args": { + "External id": 445872,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007868511.875, "dur": 5.744, + "args": { + "External id": 445873,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007868513.530, "dur": 3.825, + "args": { + "External id": 445874,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007868591.903, "dur": 220.034, + "args": { + "External id": 445875,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007868594.103, "dur": 4.114, + "args": { + "External id": 445876,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007868599.574, "dur": 211.947, + "args": { + "External id": 445877,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007868601.400, "dur": 0.511, + "args": { + "External id": 445878,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007868603.209, "dur": 19.560, + "args": { + "External id": 445879,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007868624.318, "dur": 5.460, + "args": { + "External id": 445880,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868628.777, "dur": 0.748, + "args": { + "External id": 445881,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007868630.595, "dur": 22.145, + "args": { + "External id": 445882,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007868632.022, "dur": 1.312, + "args": { + "External id": 445883,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007868634.507, "dur": 17.957, + "args": { + "External id": 445884,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007868637.027, "dur": 2.122, + "args": { + "External id": 445885,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007868689.398, "dur": 23.915, + "args": { + "External id": 445886,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007868715.180, "dur": 14.964, + "args": { + "External id": 445887,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007868733.153, "dur": 14.150, + "args": { + "External id": 445888,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007868748.728, "dur": 12.968, + "args": { + "External id": 445889,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007868763.579, "dur": 22.250, + "args": { + "External id": 445890,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007868765.776, "dur": 1.888, + "args": { + "External id": 445891,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868770.070, "dur": 3.150, + "args": { + "External id": 445892,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007868787.796, "dur": 10.880, + "args": { + "External id": 445893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007868799.551, "dur": 10.607, + "args": { + "External id": 445894,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007868819.624, "dur": 2.160, + "args": { + "External id": 445895,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868830.483, "dur": 3.407, + "args": { + "External id": 445896,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868832.583, "dur": 0.460, + "args": { + "External id": 445897,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007868900.270, "dur": 43.066, + "args": { + "External id": 445898,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007868947.863, "dur": 5.041, + "args": { + "External id": 445899,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868950.689, "dur": 1.215, + "args": { + "External id": 445900,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007868954.120, "dur": 20.244, + "args": { + "External id": 445901,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007868978.871, "dur": 6.222, + "args": { + "External id": 445902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007868980.758, "dur": 3.722, + "args": { + "External id": 445903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007868982.791, "dur": 1.481, + "args": { + "External id": 445904,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007868987.847, "dur": 38.196, + "args": { + "External id": 445905,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007868989.031, "dur": 36.473, + "args": { + "External id": 445906,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007869029.309, "dur": 12.692, + "args": { + "External id": 445907,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007869046.362, "dur": 21.375, + "args": { + "External id": 445908,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007869048.798, "dur": 18.579, + "args": { + "External id": 445909,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869053.489, "dur": 1.241, + "args": { + "External id": 445910,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007869072.854, "dur": 45.077, + "args": { + "External id": 445911,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007869075.005, "dur": 42.654, + "args": { + "External id": 445912,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 8135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869079.785, "dur": 20.768, + "args": { + "External id": 445913,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007869102.680, "dur": 14.480, + "args": { + "External id": 445914,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007869130.845, "dur": 5.728, + "args": { + "External id": 445915,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007869133.233, "dur": 3.075, + "args": { + "External id": 445916,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007869137.702, "dur": 1.681, + "args": { + "External id": 445917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007869138.408, "dur": 0.908, + "args": { + "External id": 445918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007869183.578, "dur": 19.964, + "args": { + "External id": 445919,"Sequence number": 5285592, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007869205.588, "dur": 13.466, + "args": { + "External id": 445920,"Sequence number": 5285593, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8143 + } + }, + { + "ph": "s", "id": 9, "pid": 4183441, "tid": 4183441, "ts": 676007869205.588, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007869224.840, "dur": 6.096, + "args": { + "External id": 445921,"Sequence number": 5285594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 8144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869228.343, "dur": 1.225, + "args": { + "External id": 445922,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007869233.525, "dur": 7.095, + "args": { + "External id": 445923,"Sequence number": 5285594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "3"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 8146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869238.417, "dur": 0.876, + "args": { + "External id": 445924,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007869242.089, "dur": 3.570, + "args": { + "External id": 445925,"Sequence number": 5285594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 8148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869244.027, "dur": 1.066, + "args": { + "External id": 445926,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 8149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007869249.739, "dur": 6.231, + "args": { + "External id": 445927,"Sequence number": 5285594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 8150 + } + }, + { + "ph": "s", "id": 8, "pid": 4183441, "tid": 4183441, "ts": 676007869249.739, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869253.478, "dur": 1.041, + "args": { + "External id": 445928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007869257.410, "dur": 5.402, + "args": { + "External id": 445929,"Sequence number": 5285595, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], [], []], "Ev Idx": 8152 + } + }, + { + "ph": "s", "id": 7, "pid": 4183441, "tid": 4183441, "ts": 676007869257.410, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869260.928, "dur": 1.036, + "args": { + "External id": 445930,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 1024]", "[16777216, 4096, 1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 4183441, "tid": 4183441, + "ts": 676007869263.965, "dur": 5.999, + "args": { + "External id": 445931,"Sequence number": 5285596, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], []], "Input Dims": [[16, 4096, 4, 1024], [], []], "Ev Idx": 8154 + } + }, + { + "ph": "s", "id": 6, "pid": 4183441, "tid": 4183441, "ts": 676007869263.965, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869268.198, "dur": 0.904, + "args": { + "External id": 445932,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1024, 1], [], [], []], "Input Dims": [[16, 4096, 4, 1024], [], [], []], "Ev Idx": 8155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007869271.071, "dur": 4.708, + "args": { + "External id": 445933,"Sequence number": 5285597, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], [], []], "Ev Idx": 8156 + } + }, + { + "ph": "s", "id": 5, "pid": 4183441, "tid": 4183441, "ts": 676007869271.071, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869274.120, "dur": 0.916, + "args": { + "External id": 445934,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1024]", "[16777216, 4096, 1]", "3072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[16777216, 4096, 1], [], [], []], "Input Dims": [[16, 4096, 1024], [], [], []], "Ev Idx": 8157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007869279.514, "dur": 29.755, + "args": { + "External id": 445935,"Sequence number": 5285598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007869280.905, "dur": 28.112, + "args": { + "External id": 445936,"Sequence number": 5285598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869283.724, "dur": 7.220, + "args": { + "External id": 445937,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 8160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007869286.196, "dur": 4.234, + "args": { + "External id": 445938,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007869291.771, "dur": 16.818, + "args": { + "External id": 445939,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 8162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007869336.354, "dur": 5.979, + "args": { + "External id": 445940,"Sequence number": 5285598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 1024]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[16777216, 4096, 1], []], "Input Dims": [[16, 4096, 1024], []], "Ev Idx": 8163 + } + }, + { + "ph": "s", "id": 4, "pid": 4183441, "tid": 4183441, "ts": 676007869336.354, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007869344.704, "dur": 1.671, + "args": { + "External id": 445941,"Sequence number": 5285599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 4183441, "tid": 4183441, + "ts": 676007869378.346, "dur": 24160.145, + "args": { + "External id": 445942,"Sequence number": 5285599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [1], [1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [65536], [32000, 1024], [], [], [], [], []], "Ev Idx": 8165 + } + }, + { + "ph": "s", "id": 3, "pid": 4183441, "tid": 4183441, "ts": 676007869378.346, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 4183441, "tid": 4183441, + "ts": 676007869392.439, "dur": 25.377, + "args": { + "External id": 445943,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676007869393.370, "dur": 24.223, + "args": { + "External id": 445944,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869394.524, "dur": 5.506, + "args": { + "External id": 445945,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[4096, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007869396.127, "dur": 3.501, + "args": { + "External id": 445946,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007869400.827, "dur": 16.393, + "args": { + "External id": 445947,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [4096, 1], []], "Input Dims": [[65536, 1024], [65536, 1024], []], "Ev Idx": 8170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869432.768, "dur": 25.142, + "args": { + "External id": 445948,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869434.024, "dur": 6.676, + "args": { + "External id": 445949,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], [], []], "Ev Idx": 8172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869436.527, "dur": 3.811, + "args": { + "External id": 445950,"Record function id": 0, "Concrete Inputs": ["[65536, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007869442.120, "dur": 15.550, + "args": { + "External id": 445951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007869443.837, "dur": 13.497, + "args": { + "External id": 445952,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[65536, 1024], []], "Ev Idx": 8175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869486.379, "dur": 18.989, + "args": { + "External id": 445953,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007869487.183, "dur": 5.211, + "args": { + "External id": 445954,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869489.092, "dur": 3.062, + "args": { + "External id": 445955,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007869492.965, "dur": 12.213, + "args": { + "External id": 445956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007869493.325, "dur": 11.493, + "args": { + "External id": 445957,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1024, 1], []], "Input Dims": [[32000, 1024], []], "Ev Idx": 8180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676007869511.154, "dur": 17.217, + "args": { + "External id": 445958,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007869515.358, "dur": 2.245, + "args": { + "External id": 445959,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676007869518.154, "dur": 9.961, + "args": { + "External id": 445960,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 8183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007869518.743, "dur": 8.907, + "args": { + "External id": 445961,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 4183441, + "ts": 676007869533.467, "dur": 20.199, + "args": { + "External id": 445962,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007869556.599, "dur": 46.539, + "args": { + "External id": 445963,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007869558.539, "dur": 44.107, + "args": { + "External id": 445964,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869562.289, "dur": 1.461, + "args": { + "External id": 445965,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007869564.995, "dur": 22.528, + "args": { + "External id": 445966,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007869566.354, "dur": 20.978, + "args": { + "External id": 445967,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 8190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007869570.856, "dur": 2.411, + "args": { + "External id": 445968,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007869574.045, "dur": 12.864, + "args": { + "External id": 445969,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 8192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676007869607.150, "dur": 18381.153, + "args": { + "External id": 445970,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676007869608.381, "dur": 18378.901, + "args": { + "External id": 445971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007887998.296, "dur": 6.964, + "args": { + "External id": 445972,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888002.349, "dur": 1.005, + "args": { + "External id": 445973,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007888010.463, "dur": 117.847, + "args": { + "External id": 445974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007888012.371, "dur": 6.202, + "args": { + "External id": 445975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007888014.374, "dur": 3.157, + "args": { + "External id": 445976,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888016.348, "dur": 0.894, + "args": { + "External id": 445977,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007888020.044, "dur": 107.495, + "args": { + "External id": 445978,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007888021.581, "dur": 104.671, + "args": { + "External id": 445979,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007888133.229, "dur": 4.977, + "args": { + "External id": 445980,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888135.961, "dur": 1.007, + "args": { + "External id": 445981,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007888145.839, "dur": 3.034, + "args": { + "External id": 445982,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888163.574, "dur": 7.128, + "args": { + "External id": 445983,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888165.951, "dur": 4.479, + "args": { + "External id": 445984,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007888303.704, "dur": 207.366, + "args": { + "External id": 445985,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888308.727, "dur": 2.571, + "args": { + "External id": 445986,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007888313.150, "dur": 197.537, + "args": { + "External id": 445987,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007888315.141, "dur": 0.690, + "args": { + "External id": 445988,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007888317.652, "dur": 26.884, + "args": { + "External id": 445989,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007888346.517, "dur": 5.690, + "args": { + "External id": 445990,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888351.141, "dur": 0.741, + "args": { + "External id": 445991,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007888353.672, "dur": 26.171, + "args": { + "External id": 445992,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888354.975, "dur": 1.381, + "args": { + "External id": 445993,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007888357.782, "dur": 21.768, + "args": { + "External id": 445994,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007888361.633, "dur": 3.495, + "args": { + "External id": 445995,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007888381.741, "dur": 23.763, + "args": { + "External id": 445996,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007888407.459, "dur": 18.296, + "args": { + "External id": 445997,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007888429.227, "dur": 15.484, + "args": { + "External id": 445998,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007888446.521, "dur": 13.234, + "args": { + "External id": 445999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007888461.592, "dur": 20.319, + "args": { + "External id": 446000,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007888463.750, "dur": 1.548, + "args": { + "External id": 446001,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888468.276, "dur": 1.017, + "args": { + "External id": 446002,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007888483.524, "dur": 12.357, + "args": { + "External id": 446003,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007888497.579, "dur": 12.146, + "args": { + "External id": 446004,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007888517.607, "dur": 2.071, + "args": { + "External id": 446005,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007888526.861, "dur": 4.099, + "args": { + "External id": 446006,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888529.086, "dur": 0.893, + "args": { + "External id": 446007,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007888606.619, "dur": 96.837, + "args": { + "External id": 446008,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007888710.873, "dur": 13.493, + "args": { + "External id": 446009,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888719.767, "dur": 1.346, + "args": { + "External id": 446010,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007888726.254, "dur": 27.926, + "args": { + "External id": 446011,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007888760.519, "dur": 8.737, + "args": { + "External id": 446012,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007888762.339, "dur": 6.191, + "args": { + "External id": 446013,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888764.540, "dur": 3.694, + "args": { + "External id": 446014,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007888773.348, "dur": 53.770, + "args": { + "External id": 446015,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007888774.875, "dur": 51.710, + "args": { + "External id": 446016,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007888831.805, "dur": 17.195, + "args": { + "External id": 446017,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007888855.747, "dur": 5.042, + "args": { + "External id": 446018,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888858.317, "dur": 1.323, + "args": { + "External id": 446019,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007888865.596, "dur": 51.573, + "args": { + "External id": 446020,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007888866.714, "dur": 5.059, + "args": { + "External id": 446021,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007888867.826, "dur": 3.333, + "args": { + "External id": 446022,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888869.993, "dur": 1.006, + "args": { + "External id": 446023,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007888872.722, "dur": 44.014, + "args": { + "External id": 446024,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007888873.426, "dur": 42.870, + "args": { + "External id": 446025,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007888921.422, "dur": 3.593, + "args": { + "External id": 446026,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007888923.028, "dur": 0.948, + "args": { + "External id": 446027,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007888931.902, "dur": 1.763, + "args": { + "External id": 446028,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888942.488, "dur": 7.065, + "args": { + "External id": 446029,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007888944.992, "dur": 4.228, + "args": { + "External id": 446030,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007889047.154, "dur": 260.026, + "args": { + "External id": 446031,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889049.887, "dur": 2.663, + "args": { + "External id": 446032,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007889055.986, "dur": 250.612, + "args": { + "External id": 446033,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007889057.649, "dur": 0.333, + "args": { + "External id": 446034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007889059.715, "dur": 20.728, + "args": { + "External id": 446035,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007889097.353, "dur": 7.013, + "args": { + "External id": 446036,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889100.136, "dur": 3.743, + "args": { + "External id": 446037,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007889105.689, "dur": 26.094, + "args": { + "External id": 446038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889107.325, "dur": 2.818, + "args": { + "External id": 446039,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007889111.768, "dur": 19.724, + "args": { + "External id": 446040,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007889115.352, "dur": 3.334, + "args": { + "External id": 446041,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007889133.409, "dur": 21.379, + "args": { + "External id": 446042,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007889156.138, "dur": 12.696, + "args": { + "External id": 446043,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8266 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007889171.981, "dur": 13.777, + "args": { + "External id": 446044,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007889187.273, "dur": 13.462, + "args": { + "External id": 446045,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007889202.571, "dur": 22.311, + "args": { + "External id": 446046,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007889204.433, "dur": 1.900, + "args": { + "External id": 446047,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8270 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889208.503, "dur": 2.751, + "args": { + "External id": 446048,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007889226.509, "dur": 34.526, + "args": { + "External id": 446049,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007889262.519, "dur": 43.184, + "args": { + "External id": 446050,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007889315.399, "dur": 2.477, + "args": { + "External id": 446051,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007889327.447, "dur": 3.812, + "args": { + "External id": 446052,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889329.834, "dur": 0.472, + "args": { + "External id": 446053,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007889410.467, "dur": 46.540, + "args": { + "External id": 446054,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007889461.993, "dur": 4.550, + "args": { + "External id": 446055,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889464.400, "dur": 1.010, + "args": { + "External id": 446056,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "8388608"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007889467.993, "dur": 23.364, + "args": { + "External id": 446057,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007889504.414, "dur": 8.743, + "args": { + "External id": 446058,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007889506.413, "dur": 5.894, + "args": { + "External id": 446059,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889509.229, "dur": 2.808, + "args": { + "External id": 446060,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007889515.897, "dur": 42.974, + "args": { + "External id": 446061,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007889517.180, "dur": 41.033, + "args": { + "External id": 446062,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007889562.689, "dur": 13.483, + "args": { + "External id": 446063,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007889581.855, "dur": 3.642, + "args": { + "External id": 446064,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889583.717, "dur": 0.974, + "args": { + "External id": 446065,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007889589.289, "dur": 46.660, + "args": { + "External id": 446066,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007889590.314, "dur": 4.051, + "args": { + "External id": 446067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007889591.537, "dur": 2.282, + "args": { + "External id": 446068,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889592.992, "dur": 0.673, + "args": { + "External id": 446069,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007889595.098, "dur": 40.501, + "args": { + "External id": 446070,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007889595.858, "dur": 39.257, + "args": { + "External id": 446071,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007889640.194, "dur": 3.402, + "args": { + "External id": 446072,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889641.959, "dur": 0.656, + "args": { + "External id": 446073,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007889648.931, "dur": 1.377, + "args": { + "External id": 446074,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889695.922, "dur": 8.016, + "args": { + "External id": 446075,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8298 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889698.349, "dur": 5.145, + "args": { + "External id": 446076,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8299 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007889795.357, "dur": 177.926, + "args": { + "External id": 446077,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889797.596, "dur": 2.270, + "args": { + "External id": 446078,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007889803.715, "dur": 169.100, + "args": { + "External id": 446079,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007889805.405, "dur": 0.617, + "args": { + "External id": 446080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007889807.472, "dur": 20.691, + "args": { + "External id": 446081,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007889829.724, "dur": 5.882, + "args": { + "External id": 446082,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889832.015, "dur": 3.244, + "args": { + "External id": 446083,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007889836.619, "dur": 21.459, + "args": { + "External id": 446084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007889837.941, "dur": 1.558, + "args": { + "External id": 446085,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007889841.255, "dur": 16.546, + "args": { + "External id": 446086,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007889844.163, "dur": 2.620, + "args": { + "External id": 446087,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007889862.653, "dur": 19.171, + "args": { + "External id": 446088,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007889883.239, "dur": 14.755, + "args": { + "External id": 446089,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007889900.327, "dur": 12.420, + "args": { + "External id": 446090,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007889914.459, "dur": 11.911, + "args": { + "External id": 446091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007889928.445, "dur": 17.932, + "args": { + "External id": 446092,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007889930.236, "dur": 1.262, + "args": { + "External id": 446093,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889933.687, "dur": 0.756, + "args": { + "External id": 446094,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007889948.184, "dur": 12.187, + "args": { + "External id": 446095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007889961.381, "dur": 10.169, + "args": { + "External id": 446096,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007889979.532, "dur": 2.326, + "args": { + "External id": 446097,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007889990.922, "dur": 4.047, + "args": { + "External id": 446098,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007889993.434, "dur": 0.771, + "args": { + "External id": 446099,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890059.381, "dur": 61.721, + "args": { + "External id": 446100,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890127.571, "dur": 6.319, + "args": { + "External id": 446101,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890131.293, "dur": 1.080, + "args": { + "External id": 446102,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007890135.464, "dur": 23.917, + "args": { + "External id": 446103,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007890164.158, "dur": 6.263, + "args": { + "External id": 446104,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007890165.720, "dur": 3.998, + "args": { + "External id": 446105,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890167.779, "dur": 1.738, + "args": { + "External id": 446106,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007890173.607, "dur": 47.291, + "args": { + "External id": 446107,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890175.172, "dur": 45.049, + "args": { + "External id": 446108,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007890224.771, "dur": 14.883, + "args": { + "External id": 446109,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890245.324, "dur": 4.152, + "args": { + "External id": 446110,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890247.725, "dur": 0.791, + "args": { + "External id": 446111,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007890253.861, "dur": 46.857, + "args": { + "External id": 446112,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007890254.755, "dur": 4.265, + "args": { + "External id": 446113,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007890255.986, "dur": 2.492, + "args": { + "External id": 446114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890257.753, "dur": 0.554, + "args": { + "External id": 446115,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007890259.808, "dur": 40.582, + "args": { + "External id": 446116,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890260.600, "dur": 39.167, + "args": { + "External id": 446117,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890304.693, "dur": 3.553, + "args": { + "External id": 446118,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890306.429, "dur": 0.634, + "args": { + "External id": 446119,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007890313.894, "dur": 1.672, + "args": { + "External id": 446120,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890322.774, "dur": 8.415, + "args": { + "External id": 446121,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890325.150, "dur": 5.727, + "args": { + "External id": 446122,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007890414.782, "dur": 171.359, + "args": { + "External id": 446123,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890416.797, "dur": 2.193, + "args": { + "External id": 446124,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007890420.451, "dur": 165.255, + "args": { + "External id": 446125,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007890422.044, "dur": 0.341, + "args": { + "External id": 446126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007890423.743, "dur": 23.183, + "args": { + "External id": 446127,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007890448.235, "dur": 3.808, + "args": { + "External id": 446128,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890450.494, "dur": 1.323, + "args": { + "External id": 446129,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007890452.663, "dur": 24.160, + "args": { + "External id": 446130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890453.582, "dur": 1.833, + "args": { + "External id": 446131,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007890456.468, "dur": 20.031, + "args": { + "External id": 446132,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007890461.748, "dur": 2.660, + "args": { + "External id": 446133,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007890478.260, "dur": 19.370, + "args": { + "External id": 446134,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007890498.992, "dur": 11.731, + "args": { + "External id": 446135,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007890513.724, "dur": 13.770, + "args": { + "External id": 446136,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007890528.843, "dur": 10.825, + "args": { + "External id": 446137,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007890541.325, "dur": 18.012, + "args": { + "External id": 446138,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007890542.904, "dur": 1.439, + "args": { + "External id": 446139,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890546.348, "dur": 0.994, + "args": { + "External id": 446140,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007890560.656, "dur": 10.812, + "args": { + "External id": 446141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007890572.478, "dur": 12.084, + "args": { + "External id": 446142,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007890591.985, "dur": 1.615, + "args": { + "External id": 446143,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890601.932, "dur": 3.521, + "args": { + "External id": 446144,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890604.078, "dur": 0.581, + "args": { + "External id": 446145,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890705.940, "dur": 48.416, + "args": { + "External id": 446146,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890759.714, "dur": 6.386, + "args": { + "External id": 446147,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890763.231, "dur": 1.227, + "args": { + "External id": 446148,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "25165824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007890767.608, "dur": 25.148, + "args": { + "External id": 446149,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007890797.424, "dur": 6.828, + "args": { + "External id": 446150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007890799.321, "dur": 4.308, + "args": { + "External id": 446151,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890801.679, "dur": 1.740, + "args": { + "External id": 446152,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007890806.498, "dur": 41.625, + "args": { + "External id": 446153,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890807.876, "dur": 39.560, + "args": { + "External id": 446154,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007890851.892, "dur": 16.548, + "args": { + "External id": 446155,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890874.340, "dur": 3.898, + "args": { + "External id": 446156,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890876.554, "dur": 0.837, + "args": { + "External id": 446157,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007890882.014, "dur": 49.922, + "args": { + "External id": 446158,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007890883.223, "dur": 4.471, + "args": { + "External id": 446159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007890884.253, "dur": 2.918, + "args": { + "External id": 446160,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890886.074, "dur": 0.945, + "args": { + "External id": 446161,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007890888.355, "dur": 43.184, + "args": { + "External id": 446162,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007890889.471, "dur": 41.590, + "args": { + "External id": 446163,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007890935.664, "dur": 5.887, + "args": { + "External id": 446164,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007890937.422, "dur": 3.085, + "args": { + "External id": 446165,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007890947.691, "dur": 2.231, + "args": { + "External id": 446166,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890957.538, "dur": 5.655, + "args": { + "External id": 446167,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007890959.565, "dur": 3.348, + "args": { + "External id": 446168,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007891053.357, "dur": 208.849, + "args": { + "External id": 446169,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891055.502, "dur": 2.355, + "args": { + "External id": 446170,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007891059.411, "dur": 202.329, + "args": { + "External id": 446171,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007891061.209, "dur": 0.608, + "args": { + "External id": 446172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007891063.260, "dur": 40.069, + "args": { + "External id": 446173,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007891106.279, "dur": 3.803, + "args": { + "External id": 446174,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891108.520, "dur": 1.264, + "args": { + "External id": 446175,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007891111.070, "dur": 27.815, + "args": { + "External id": 446176,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891112.252, "dur": 2.175, + "args": { + "External id": 446177,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007891115.724, "dur": 22.893, + "args": { + "External id": 446178,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007891121.972, "dur": 2.718, + "args": { + "External id": 446179,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007891140.331, "dur": 21.560, + "args": { + "External id": 446180,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007891163.217, "dur": 14.027, + "args": { + "External id": 446181,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007891179.785, "dur": 13.560, + "args": { + "External id": 446182,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007891194.933, "dur": 13.692, + "args": { + "External id": 446183,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007891210.760, "dur": 22.769, + "args": { + "External id": 446184,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007891212.883, "dur": 1.997, + "args": { + "External id": 446185,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891217.463, "dur": 0.828, + "args": { + "External id": 446186,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007891235.218, "dur": 13.473, + "args": { + "External id": 446187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007891249.934, "dur": 10.663, + "args": { + "External id": 446188,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007891269.500, "dur": 2.064, + "args": { + "External id": 446189,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007891280.359, "dur": 4.001, + "args": { + "External id": 446190,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891283.080, "dur": 0.564, + "args": { + "External id": 446191,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007891355.697, "dur": 45.583, + "args": { + "External id": 446192,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007891405.976, "dur": 5.310, + "args": { + "External id": 446193,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891408.993, "dur": 1.264, + "args": { + "External id": 446194,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007891412.520, "dur": 22.625, + "args": { + "External id": 446195,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007891439.655, "dur": 6.402, + "args": { + "External id": 446196,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007891441.450, "dur": 3.770, + "args": { + "External id": 446197,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891443.587, "dur": 1.442, + "args": { + "External id": 446198,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007891448.623, "dur": 42.583, + "args": { + "External id": 446199,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007891450.086, "dur": 40.390, + "args": { + "External id": 446200,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007891494.485, "dur": 14.908, + "args": { + "External id": 446201,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007891514.814, "dur": 4.333, + "args": { + "External id": 446202,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891517.301, "dur": 0.935, + "args": { + "External id": 446203,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007891522.628, "dur": 49.565, + "args": { + "External id": 446204,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007891523.790, "dur": 5.669, + "args": { + "External id": 446205,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007891524.609, "dur": 4.288, + "args": { + "External id": 446206,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891526.444, "dur": 2.255, + "args": { + "External id": 446207,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007891530.287, "dur": 41.442, + "args": { + "External id": 446208,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007891530.953, "dur": 40.015, + "args": { + "External id": 446209,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007891576.100, "dur": 3.817, + "args": { + "External id": 446210,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891577.829, "dur": 0.913, + "args": { + "External id": 446211,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007891585.153, "dur": 1.554, + "args": { + "External id": 446212,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891594.489, "dur": 6.933, + "args": { + "External id": 446213,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891596.649, "dur": 4.500, + "args": { + "External id": 446214,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007891720.197, "dur": 178.091, + "args": { + "External id": 446215,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891723.322, "dur": 3.046, + "args": { + "External id": 446216,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007891727.983, "dur": 169.875, + "args": { + "External id": 446217,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007891729.932, "dur": 0.529, + "args": { + "External id": 446218,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007891733.866, "dur": 21.236, + "args": { + "External id": 446219,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007891756.714, "dur": 3.788, + "args": { + "External id": 446220,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891758.967, "dur": 1.282, + "args": { + "External id": 446221,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007891761.312, "dur": 23.966, + "args": { + "External id": 446222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007891762.423, "dur": 3.891, + "args": { + "External id": 446223,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007891767.966, "dur": 16.871, + "args": { + "External id": 446224,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007891770.455, "dur": 2.332, + "args": { + "External id": 446225,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007891787.025, "dur": 19.221, + "args": { + "External id": 446226,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007891807.607, "dur": 12.090, + "args": { + "External id": 446227,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007891822.759, "dur": 12.968, + "args": { + "External id": 446228,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007891837.494, "dur": 11.845, + "args": { + "External id": 446229,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007891851.291, "dur": 18.797, + "args": { + "External id": 446230,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007891853.183, "dur": 1.486, + "args": { + "External id": 446231,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891856.847, "dur": 0.837, + "args": { + "External id": 446232,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007891871.610, "dur": 11.652, + "args": { + "External id": 446233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007891884.662, "dur": 12.316, + "args": { + "External id": 446234,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007891904.632, "dur": 1.908, + "args": { + "External id": 446235,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007891932.310, "dur": 3.976, + "args": { + "External id": 446236,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007891934.972, "dur": 0.467, + "args": { + "External id": 446237,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892003.464, "dur": 45.486, + "args": { + "External id": 446238,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892053.750, "dur": 6.917, + "args": { + "External id": 446239,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892056.359, "dur": 3.172, + "args": { + "External id": 446240,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "41943040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007892062.192, "dur": 39.426, + "args": { + "External id": 446241,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007892108.005, "dur": 6.727, + "args": { + "External id": 446242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007892109.756, "dur": 4.230, + "args": { + "External id": 446243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892112.576, "dur": 1.109, + "args": { + "External id": 446244,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007892118.173, "dur": 45.480, + "args": { + "External id": 446245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892119.642, "dur": 43.448, + "args": { + "External id": 446246,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007892167.476, "dur": 16.235, + "args": { + "External id": 446247,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892189.550, "dur": 4.403, + "args": { + "External id": 446248,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892191.914, "dur": 1.101, + "args": { + "External id": 446249,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007892198.217, "dur": 75.129, + "args": { + "External id": 446250,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007892199.410, "dur": 4.213, + "args": { + "External id": 446251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007892200.515, "dur": 2.556, + "args": { + "External id": 446252,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892202.115, "dur": 0.789, + "args": { + "External id": 446253,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007892204.149, "dur": 68.850, + "args": { + "External id": 446254,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892205.401, "dur": 66.963, + "args": { + "External id": 446255,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892277.361, "dur": 3.544, + "args": { + "External id": 446256,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892279.054, "dur": 0.895, + "args": { + "External id": 446257,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007892286.436, "dur": 1.788, + "args": { + "External id": 446258,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892296.432, "dur": 6.739, + "args": { + "External id": 446259,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892298.128, "dur": 4.787, + "args": { + "External id": 446260,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007892384.711, "dur": 178.150, + "args": { + "External id": 446261,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892386.497, "dur": 4.175, + "args": { + "External id": 446262,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007892392.192, "dur": 170.159, + "args": { + "External id": 446263,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007892393.762, "dur": 0.619, + "args": { + "External id": 446264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007892395.802, "dur": 20.792, + "args": { + "External id": 446265,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007892418.604, "dur": 5.222, + "args": { + "External id": 446266,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892422.594, "dur": 0.993, + "args": { + "External id": 446267,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007892424.659, "dur": 21.779, + "args": { + "External id": 446268,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892425.611, "dur": 1.695, + "args": { + "External id": 446269,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007892428.660, "dur": 17.478, + "args": { + "External id": 446270,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007892431.417, "dur": 2.262, + "args": { + "External id": 446271,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007892447.980, "dur": 20.229, + "args": { + "External id": 446272,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007892469.235, "dur": 13.823, + "args": { + "External id": 446273,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007892485.413, "dur": 13.167, + "args": { + "External id": 446274,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007892500.057, "dur": 11.485, + "args": { + "External id": 446275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007892513.345, "dur": 21.329, + "args": { + "External id": 446276,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007892517.783, "dur": 1.400, + "args": { + "External id": 446277,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892521.370, "dur": 0.812, + "args": { + "External id": 446278,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007892536.166, "dur": 13.181, + "args": { + "External id": 446279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007892550.704, "dur": 10.703, + "args": { + "External id": 446280,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007892568.658, "dur": 1.602, + "args": { + "External id": 446281,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892578.140, "dur": 3.777, + "args": { + "External id": 446282,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892580.369, "dur": 0.557, + "args": { + "External id": 446283,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892643.709, "dur": 80.982, + "args": { + "External id": 446284,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892731.422, "dur": 6.637, + "args": { + "External id": 446285,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892734.764, "dur": 1.354, + "args": { + "External id": 446286,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007892739.266, "dur": 23.937, + "args": { + "External id": 446287,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007892768.126, "dur": 7.039, + "args": { + "External id": 446288,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007892769.913, "dur": 4.642, + "args": { + "External id": 446289,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892772.731, "dur": 1.624, + "args": { + "External id": 446290,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007892778.275, "dur": 42.636, + "args": { + "External id": 446291,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892780.055, "dur": 40.226, + "args": { + "External id": 446292,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007892824.301, "dur": 15.247, + "args": { + "External id": 446293,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892844.946, "dur": 3.601, + "args": { + "External id": 446294,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892847.097, "dur": 0.607, + "args": { + "External id": 446295,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 4183441, "tid": 4183441, + "ts": 676007892852.537, "dur": 46.881, + "args": { + "External id": 446296,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [32000, 1024], []], "Ev Idx": 8519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007892853.679, "dur": 4.165, + "args": { + "External id": 446297,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007892854.586, "dur": 2.693, + "args": { + "External id": 446298,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], []], "Input Dims": [[32000, 1024], [], []], "Ev Idx": 8521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892856.320, "dur": 0.811, + "args": { + "External id": 446299,"Record function id": 0, "Concrete Inputs": ["", "[1024, 32000]", "[1, 1024]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[32000, 1024], [], [], []], "Ev Idx": 8522 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007892858.817, "dur": 40.231, + "args": { + "External id": 446300,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8523 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007892859.532, "dur": 38.894, + "args": { + "External id": 446301,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1024, 1], [1, 1024]], "Input Dims": [[8192, 1024], [1024, 32000]], "Ev Idx": 8524 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007892903.565, "dur": 3.963, + "args": { + "External id": 446302,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8525 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007892905.559, "dur": 1.038, + "args": { + "External id": 446303,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8526 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007892913.505, "dur": 1.506, + "args": { + "External id": 446304,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8527 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892922.884, "dur": 6.239, + "args": { + "External id": 446305,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8528 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007892924.762, "dur": 4.100, + "args": { + "External id": 446306,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8529 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007893005.974, "dur": 196.160, + "args": { + "External id": 446307,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8530 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007893010.580, "dur": 2.210, + "args": { + "External id": 446308,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8531 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 4183441, "tid": 4183441, + "ts": 676007893013.993, "dur": 187.658, + "args": { + "External id": 446309,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8532 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 4183441, "tid": 4183441, + "ts": 676007893015.695, "dur": 0.284, + "args": { + "External id": 446310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8533 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 4183441, "tid": 4183441, + "ts": 676007893017.381, "dur": 19.775, + "args": { + "External id": 446311,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8534 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 4183441, "tid": 4183441, + "ts": 676007893038.706, "dur": 5.267, + "args": { + "External id": 446312,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8535 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893042.788, "dur": 0.952, + "args": { + "External id": 446313,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8536 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007893045.008, "dur": 19.890, + "args": { + "External id": 446314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8537 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676007893046.197, "dur": 1.808, + "args": { + "External id": 446315,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8538 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676007893049.364, "dur": 15.309, + "args": { + "External id": 446316,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8539 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007893051.970, "dur": 2.001, + "args": { + "External id": 446317,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8540 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676007893066.385, "dur": 36.409, + "args": { + "External id": 446318,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8541 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007893105.066, "dur": 15.463, + "args": { + "External id": 446319,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8542 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 4183441, "tid": 4183441, + "ts": 676007893123.721, "dur": 13.827, + "args": { + "External id": 446320,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8543 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 4183441, "tid": 4183441, + "ts": 676007893139.048, "dur": 11.165, + "args": { + "External id": 446321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8544 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007893152.402, "dur": 20.026, + "args": { + "External id": 446322,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8545 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676007893154.502, "dur": 2.236, + "args": { + "External id": 446323,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8546 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893159.053, "dur": 1.061, + "args": { + "External id": 446324,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8547 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 4183441, "tid": 4183441, + "ts": 676007893173.933, "dur": 13.231, + "args": { + "External id": 446325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8548 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007893188.446, "dur": 12.184, + "args": { + "External id": 446326,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8549 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676007893209.229, "dur": 2.149, + "args": { + "External id": 446327,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8550 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007893220.776, "dur": 3.529, + "args": { + "External id": 446328,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8551 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893222.840, "dur": 0.649, + "args": { + "External id": 446329,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8552 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007893286.907, "dur": 41.877, + "args": { + "External id": 446330,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [1024, 1]], "Input Dims": [[8192, 32000], [32000, 1024]], "Ev Idx": 8553 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 4183441, "tid": 4183441, + "ts": 676007893333.006, "dur": 14.616, + "args": { + "External id": 446331,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1024, 1], [], [], [], []], "Input Dims": [[65536, 1024], [], [], [], []], "Ev Idx": 8554 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893345.382, "dur": 0.952, + "args": { + "External id": 446332,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1024]", "[1024, 1]", "58720256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1024, 1], [], [], []], "Input Dims": [[65536, 1024], [], [], []], "Ev Idx": 8555 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007893348.927, "dur": 21.044, + "args": { + "External id": 446333,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[8192, 1024], [8192, 1024], []], "Ev Idx": 8556 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 4183441, "tid": 4183441, + "ts": 676007893374.335, "dur": 7.770, + "args": { + "External id": 446334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8557 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 4183441, "tid": 4183441, + "ts": 676007893376.044, "dur": 5.463, + "args": { + "External id": 446335,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8558 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893378.127, "dur": 3.150, + "args": { + "External id": 446336,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8559 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 4183441, "tid": 4183441, + "ts": 676007893384.495, "dur": 39.251, + "args": { + "External id": 446337,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8560 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 4183441, "tid": 4183441, + "ts": 676007893385.668, "dur": 37.162, + "args": { + "External id": 446338,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [1024, 1]], "Input Dims": [[32000, 8192], [8192, 1024]], "Ev Idx": 8561 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007893426.881, "dur": 13.003, + "args": { + "External id": 446339,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8562 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007893444.453, "dur": 22.562, + "args": { + "External id": 446340,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8563 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 4183441, "tid": 4183441, + "ts": 676007893446.799, "dur": 19.812, + "args": { + "External id": 446341,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8564 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893451.799, "dur": 1.358, + "args": { + "External id": 446342,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8565 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676007893471.800, "dur": 24.477, + "args": { + "External id": 446343,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], []], "Ev Idx": 8566 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 4183441, "tid": 4183441, + "ts": 676007893473.524, "dur": 22.542, + "args": { + "External id": 446344,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1024, 1], [], [], [], [], [], []], "Input Dims": [[32000, 1024], [], [], [], [], [], []], "Ev Idx": 8567 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893477.745, "dur": 3.947, + "args": { + "External id": 446345,"Record function id": 0, "Concrete Inputs": ["[32000, 1024]", "[1024, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8568 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676007893482.974, "dur": 12.573, + "args": { + "External id": 446346,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[1024, 1], [1024, 1], []], "Input Dims": [[32000, 1024], [32000, 1024], []], "Ev Idx": 8569 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007893507.263, "dur": 5.071, + "args": { + "External id": 446347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8570 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007893509.454, "dur": 2.599, + "args": { + "External id": 446348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[65536, 1024]], "Ev Idx": 8571 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 4183441, "tid": 4183441, + "ts": 676007893513.332, "dur": 1.576, + "args": { + "External id": 446349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8572 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 4183441, "tid": 4183441, + "ts": 676007893514.112, "dur": 0.724, + "args": { + "External id": 446350,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1024, 1]], "Input Dims": [[32000, 1024]], "Ev Idx": 8573 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007893556.680, "dur": 21.310, + "args": { + "External id": 446351,"Sequence number": 5285600, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8574 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 4183441, "tid": 4183441, + "ts": 676007893580.120, "dur": 12.655, + "args": { + "External id": 446352,"Sequence number": 5285601, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8575 + } + }, + { + "ph": "s", "id": 2, "pid": 4183441, "tid": 4183441, "ts": 676007893580.120, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward", "pid": 4183441, "tid": 4183441, + "ts": 676007893740.804, "dur": 42.080, + "args": { + "External id": 446353,"Record function id": 0, "Ev Idx": 8576 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183441, "tid": 4183441, + "ts": 676007893886.291, "dur": 38.611, + "args": { + "External id": 446354,"Sequence number": 5285602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8577 + } + }, + { + "ph": "s", "id": 1, "pid": 4183441, "tid": 4183441, "ts": 676007893886.291, + "cat": "fwdbwd", "name": "fwdbwd" + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ones_like", "pid": 4183441, "tid": 4183441, + "ts": 676007893986.210, "dur": 30.585, + "args": { + "External id": 446355,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 8578 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676007893988.130, "dur": 8.927, + "args": { + "External id": 446356,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 8579 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 4183441, "tid": 4183441, + "ts": 676007893992.187, "dur": 4.271, + "args": { + "External id": 446357,"Record function id": 0, "Concrete Inputs": ["[1]", "[1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8580 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676007893998.856, "dur": 17.584, + "args": { + "External id": 446358,"Record function id": 0, "Concrete Inputs": ["", "1."], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8581 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183441, "tid": 4183441, + "ts": 676008340917.643, "dur": 57.704, + "args": { + "External id": 446359,"Sequence number": 5285603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8582 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 4183441, "tid": 4183441, + "ts": 676008340983.420, "dur": 20.775, + "args": { + "External id": 446360,"Sequence number": 5285604, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8583 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676008341157.387, "dur": 29.694, + "args": { + "External id": 446361,"Sequence number": 5285605, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8584 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676008341707.524, "dur": 29.346, + "args": { + "External id": 446362,"Sequence number": 5285606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8585 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676008341743.706, "dur": 14.289, + "args": { + "External id": 446363,"Sequence number": 5285607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 8586 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 4183441, "tid": 4183441, + "ts": 676008343510.105, "dur": 2419.026, + "args": { + "External id": 446364,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8587 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 4183441, "tid": 4183441, + "ts": 676008344013.125, "dur": 744.670, + "args": { + "External id": 446365,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 8588 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 4183441, "tid": 4183441, + "ts": 676008344031.117, "dur": 78.674, + "args": { + "External id": 446366,"Record function id": 0, "Concrete Inputs": ["[13797]", "6", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8589 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676008344034.846, "dur": 12.798, + "args": { + "External id": 446367,"Record function id": 0, "Concrete Inputs": ["[13797]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8590 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 4183441, "tid": 4183441, + "ts": 676008344050.948, "dur": 58.537, + "args": { + "External id": 446368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[13797]], "Ev Idx": 8591 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 4183441, "tid": 4183441, + "ts": 676008344053.418, "dur": 55.134, + "args": { + "External id": 446369,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[13797], []], "Ev Idx": 8592 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345957.816, "dur": 4.267, + "args": { + "External id": 446370,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8593 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345964.032, "dur": 0.374, + "args": { + "External id": 446371,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8594 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345966.043, "dur": 0.502, + "args": { + "External id": 446372,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8595 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345967.909, "dur": 0.463, + "args": { + "External id": 446373,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8596 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345969.810, "dur": 0.463, + "args": { + "External id": 446374,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8597 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345971.457, "dur": 0.402, + "args": { + "External id": 446375,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8598 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345973.007, "dur": 0.434, + "args": { + "External id": 446376,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8599 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345976.081, "dur": 0.482, + "args": { + "External id": 446377,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8600 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345977.639, "dur": 0.433, + "args": { + "External id": 446378,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8601 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345979.154, "dur": 0.511, + "args": { + "External id": 446379,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8602 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345980.765, "dur": 0.488, + "args": { + "External id": 446380,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8603 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345982.289, "dur": 0.452, + "args": { + "External id": 446381,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8604 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345983.557, "dur": 0.436, + "args": { + "External id": 446382,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8605 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345984.987, "dur": 0.231, + "args": { + "External id": 446383,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8606 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345986.044, "dur": 0.226, + "args": { + "External id": 446384,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8607 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345988.452, "dur": 0.237, + "args": { + "External id": 446385,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8608 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345989.511, "dur": 0.232, + "args": { + "External id": 446386,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8609 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345990.712, "dur": 0.235, + "args": { + "External id": 446387,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8610 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345991.730, "dur": 0.224, + "args": { + "External id": 446388,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8611 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345992.820, "dur": 0.221, + "args": { + "External id": 446389,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8612 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345993.864, "dur": 0.237, + "args": { + "External id": 446390,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8613 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345995.004, "dur": 0.219, + "args": { + "External id": 446391,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8614 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345996.086, "dur": 0.235, + "args": { + "External id": 446392,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8615 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008345998.938, "dur": 0.221, + "args": { + "External id": 446393,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8616 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346000.169, "dur": 0.221, + "args": { + "External id": 446394,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8617 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346001.237, "dur": 0.213, + "args": { + "External id": 446395,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8618 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346002.422, "dur": 0.229, + "args": { + "External id": 446396,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8619 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346003.628, "dur": 0.243, + "args": { + "External id": 446397,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8620 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346004.628, "dur": 0.242, + "args": { + "External id": 446398,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8621 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346005.677, "dur": 0.237, + "args": { + "External id": 446399,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8622 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346006.650, "dur": 0.218, + "args": { + "External id": 446400,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8623 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346009.577, "dur": 0.227, + "args": { + "External id": 446401,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8624 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346010.544, "dur": 0.208, + "args": { + "External id": 446402,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8625 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346011.887, "dur": 0.231, + "args": { + "External id": 446403,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8626 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346012.905, "dur": 0.216, + "args": { + "External id": 446404,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8627 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346013.997, "dur": 0.249, + "args": { + "External id": 446405,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8628 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346015.179, "dur": 0.236, + "args": { + "External id": 446406,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8629 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346016.353, "dur": 0.230, + "args": { + "External id": 446407,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8630 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346017.474, "dur": 0.233, + "args": { + "External id": 446408,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8631 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346019.667, "dur": 0.455, + "args": { + "External id": 446409,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8632 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346020.920, "dur": 0.258, + "args": { + "External id": 446410,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8633 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346022.065, "dur": 0.451, + "args": { + "External id": 446411,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8634 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346023.436, "dur": 0.482, + "args": { + "External id": 446412,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8635 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346024.749, "dur": 0.229, + "args": { + "External id": 446413,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8636 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346025.781, "dur": 0.230, + "args": { + "External id": 446414,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8637 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346026.830, "dur": 0.442, + "args": { + "External id": 446415,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8638 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346028.148, "dur": 0.453, + "args": { + "External id": 446416,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8639 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346032.016, "dur": 0.233, + "args": { + "External id": 446417,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8640 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346033.222, "dur": 0.220, + "args": { + "External id": 446418,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8641 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346034.195, "dur": 0.241, + "args": { + "External id": 446419,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8642 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346035.199, "dur": 0.239, + "args": { + "External id": 446420,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8643 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346036.303, "dur": 0.246, + "args": { + "External id": 446421,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8644 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346037.375, "dur": 0.224, + "args": { + "External id": 446422,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8645 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346038.452, "dur": 0.227, + "args": { + "External id": 446423,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8646 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346039.562, "dur": 0.233, + "args": { + "External id": 446424,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8647 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346042.338, "dur": 0.227, + "args": { + "External id": 446425,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8648 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346043.327, "dur": 0.214, + "args": { + "External id": 446426,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8649 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346044.359, "dur": 0.198, + "args": { + "External id": 446427,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8650 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346045.306, "dur": 0.229, + "args": { + "External id": 446428,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8651 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346046.264, "dur": 0.221, + "args": { + "External id": 446429,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8652 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346047.215, "dur": 0.246, + "args": { + "External id": 446430,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8653 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346048.281, "dur": 0.239, + "args": { + "External id": 446431,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8654 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346049.293, "dur": 0.239, + "args": { + "External id": 446432,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8655 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346051.027, "dur": 0.220, + "args": { + "External id": 446433,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8656 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346052.226, "dur": 0.243, + "args": { + "External id": 446434,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8657 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346053.415, "dur": 0.226, + "args": { + "External id": 446435,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8658 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346054.429, "dur": 0.237, + "args": { + "External id": 446436,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8659 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346055.448, "dur": 0.223, + "args": { + "External id": 446437,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8660 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346056.468, "dur": 0.217, + "args": { + "External id": 446438,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8661 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346057.420, "dur": 0.399, + "args": { + "External id": 446439,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8662 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346058.561, "dur": 0.433, + "args": { + "External id": 446440,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8663 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346061.069, "dur": 0.414, + "args": { + "External id": 446441,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8664 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346062.287, "dur": 0.451, + "args": { + "External id": 446442,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8665 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346063.481, "dur": 0.446, + "args": { + "External id": 446443,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8666 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346064.674, "dur": 0.235, + "args": { + "External id": 446444,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8667 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346065.702, "dur": 0.220, + "args": { + "External id": 446445,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8668 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346066.762, "dur": 0.356, + "args": { + "External id": 446446,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8669 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346068.762, "dur": 0.430, + "args": { + "External id": 446447,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8670 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346070.187, "dur": 0.220, + "args": { + "External id": 446448,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8671 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346073.042, "dur": 0.227, + "args": { + "External id": 446449,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8672 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346074.133, "dur": 0.425, + "args": { + "External id": 446450,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8673 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346075.451, "dur": 0.450, + "args": { + "External id": 446451,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8674 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346076.655, "dur": 0.401, + "args": { + "External id": 446452,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8675 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346077.959, "dur": 0.216, + "args": { + "External id": 446453,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8676 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346079.046, "dur": 0.221, + "args": { + "External id": 446454,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8677 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346080.029, "dur": 0.404, + "args": { + "External id": 446455,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8678 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346091.842, "dur": 0.824, + "args": { + "External id": 446456,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8679 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346097.059, "dur": 0.221, + "args": { + "External id": 446457,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8680 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346098.500, "dur": 0.217, + "args": { + "External id": 446458,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8681 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346099.733, "dur": 0.213, + "args": { + "External id": 446459,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8682 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346100.918, "dur": 0.228, + "args": { + "External id": 446460,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8683 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346102.038, "dur": 0.225, + "args": { + "External id": 446461,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8684 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346103.158, "dur": 0.274, + "args": { + "External id": 446462,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8685 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346105.155, "dur": 0.431, + "args": { + "External id": 446463,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8686 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346106.671, "dur": 0.573, + "args": { + "External id": 446464,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8687 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346127.205, "dur": 0.269, + "args": { + "External id": 451073,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8688 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346128.462, "dur": 0.271, + "args": { + "External id": 451074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8689 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346129.611, "dur": 0.215, + "args": { + "External id": 451075,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8690 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346130.621, "dur": 0.238, + "args": { + "External id": 451076,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8691 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346131.604, "dur": 0.253, + "args": { + "External id": 451077,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8692 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346132.680, "dur": 0.226, + "args": { + "External id": 451078,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8693 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346133.653, "dur": 0.250, + "args": { + "External id": 451079,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8694 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346134.643, "dur": 0.218, + "args": { + "External id": 451080,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8695 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346136.795, "dur": 0.218, + "args": { + "External id": 451081,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8696 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346137.788, "dur": 0.215, + "args": { + "External id": 451082,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8697 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346138.736, "dur": 0.220, + "args": { + "External id": 451083,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8698 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346139.743, "dur": 0.221, + "args": { + "External id": 451084,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8699 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346140.804, "dur": 0.220, + "args": { + "External id": 451085,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8700 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346141.836, "dur": 0.228, + "args": { + "External id": 451086,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8701 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346143.269, "dur": 0.205, + "args": { + "External id": 451087,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8702 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346144.264, "dur": 0.220, + "args": { + "External id": 451088,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8703 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346146.942, "dur": 0.214, + "args": { + "External id": 451089,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8704 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346147.882, "dur": 0.227, + "args": { + "External id": 451090,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8705 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346148.882, "dur": 0.244, + "args": { + "External id": 451091,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8706 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346149.901, "dur": 0.216, + "args": { + "External id": 451092,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8707 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346150.906, "dur": 0.222, + "args": { + "External id": 451093,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8708 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346151.919, "dur": 0.210, + "args": { + "External id": 451094,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8709 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346152.869, "dur": 0.214, + "args": { + "External id": 451095,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8710 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346157.703, "dur": 0.213, + "args": { + "External id": 451096,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8711 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346160.134, "dur": 0.226, + "args": { + "External id": 451097,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8712 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346161.120, "dur": 0.242, + "args": { + "External id": 451098,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8713 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346162.102, "dur": 0.218, + "args": { + "External id": 451099,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8714 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346163.096, "dur": 0.207, + "args": { + "External id": 451100,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8715 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346164.141, "dur": 0.220, + "args": { + "External id": 451101,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8716 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346165.139, "dur": 0.202, + "args": { + "External id": 451102,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8717 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346166.066, "dur": 0.220, + "args": { + "External id": 451103,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8718 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346167.041, "dur": 0.214, + "args": { + "External id": 451104,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8719 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346169.176, "dur": 0.237, + "args": { + "External id": 451105,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8720 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346170.136, "dur": 0.213, + "args": { + "External id": 451106,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8721 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346171.715, "dur": 0.229, + "args": { + "External id": 451107,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8722 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346172.713, "dur": 0.219, + "args": { + "External id": 451108,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8723 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346173.720, "dur": 0.221, + "args": { + "External id": 451109,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8724 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346174.702, "dur": 0.236, + "args": { + "External id": 451110,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8725 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346175.724, "dur": 0.229, + "args": { + "External id": 451111,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8726 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346176.764, "dur": 0.246, + "args": { + "External id": 451112,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8727 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346178.665, "dur": 0.215, + "args": { + "External id": 451113,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8728 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346179.604, "dur": 0.231, + "args": { + "External id": 451114,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8729 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346180.577, "dur": 0.224, + "args": { + "External id": 451115,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8730 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346181.540, "dur": 0.221, + "args": { + "External id": 451116,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8731 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346182.556, "dur": 0.221, + "args": { + "External id": 451117,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8732 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346183.647, "dur": 0.217, + "args": { + "External id": 451118,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8733 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346184.583, "dur": 0.218, + "args": { + "External id": 451119,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8734 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346185.523, "dur": 0.220, + "args": { + "External id": 451120,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8735 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346187.627, "dur": 0.216, + "args": { + "External id": 451121,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8736 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346188.591, "dur": 0.211, + "args": { + "External id": 451122,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8737 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346189.613, "dur": 0.236, + "args": { + "External id": 451123,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8738 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346190.718, "dur": 0.223, + "args": { + "External id": 451124,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8739 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346191.686, "dur": 0.221, + "args": { + "External id": 451125,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8740 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346192.791, "dur": 0.222, + "args": { + "External id": 451126,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8741 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346194.200, "dur": 0.326, + "args": { + "External id": 451127,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8742 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346195.311, "dur": 0.224, + "args": { + "External id": 451128,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8743 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346198.340, "dur": 0.250, + "args": { + "External id": 451129,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8744 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346199.344, "dur": 0.228, + "args": { + "External id": 451130,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8745 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346200.348, "dur": 0.224, + "args": { + "External id": 451131,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8746 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346201.433, "dur": 0.222, + "args": { + "External id": 451132,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8747 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346202.433, "dur": 0.220, + "args": { + "External id": 451133,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8748 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346203.519, "dur": 0.247, + "args": { + "External id": 451134,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8749 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346204.504, "dur": 0.217, + "args": { + "External id": 451135,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8750 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346205.491, "dur": 0.218, + "args": { + "External id": 451136,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8751 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346208.215, "dur": 0.221, + "args": { + "External id": 451137,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8752 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346209.283, "dur": 0.231, + "args": { + "External id": 451138,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8753 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346211.906, "dur": 0.230, + "args": { + "External id": 451139,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8754 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346212.914, "dur": 0.213, + "args": { + "External id": 451140,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8755 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346213.931, "dur": 0.223, + "args": { + "External id": 451141,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8756 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346215.051, "dur": 0.225, + "args": { + "External id": 451142,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8757 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346216.007, "dur": 0.220, + "args": { + "External id": 451143,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8758 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346217.128, "dur": 0.223, + "args": { + "External id": 451144,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8759 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346219.792, "dur": 0.215, + "args": { + "External id": 451145,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8760 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346220.734, "dur": 0.224, + "args": { + "External id": 451146,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8761 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346221.737, "dur": 0.213, + "args": { + "External id": 451147,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8762 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346222.818, "dur": 0.223, + "args": { + "External id": 451148,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8763 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346223.773, "dur": 0.215, + "args": { + "External id": 451149,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8764 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346224.791, "dur": 0.221, + "args": { + "External id": 451150,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8765 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346226.127, "dur": 0.229, + "args": { + "External id": 451151,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8766 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346227.083, "dur": 0.214, + "args": { + "External id": 451152,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8767 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346229.827, "dur": 0.218, + "args": { + "External id": 451153,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8768 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346230.764, "dur": 0.215, + "args": { + "External id": 451154,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8769 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346231.704, "dur": 0.219, + "args": { + "External id": 451155,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8770 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346232.699, "dur": 0.218, + "args": { + "External id": 451156,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8771 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346233.674, "dur": 0.222, + "args": { + "External id": 451157,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8772 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346234.692, "dur": 0.216, + "args": { + "External id": 451158,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8773 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346235.726, "dur": 0.226, + "args": { + "External id": 451159,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8774 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346236.704, "dur": 0.224, + "args": { + "External id": 451160,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8775 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346239.426, "dur": 0.215, + "args": { + "External id": 451161,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8776 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346240.366, "dur": 0.211, + "args": { + "External id": 451162,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8777 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346241.344, "dur": 0.244, + "args": { + "External id": 451163,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8778 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346242.418, "dur": 0.211, + "args": { + "External id": 451164,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8779 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346243.528, "dur": 0.256, + "args": { + "External id": 451165,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8780 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346244.598, "dur": 0.233, + "args": { + "External id": 451166,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8781 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346245.620, "dur": 0.220, + "args": { + "External id": 451167,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8782 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346246.768, "dur": 0.222, + "args": { + "External id": 451168,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8783 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346249.227, "dur": 0.212, + "args": { + "External id": 451169,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8784 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346250.263, "dur": 0.222, + "args": { + "External id": 451170,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8785 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346251.243, "dur": 0.214, + "args": { + "External id": 451171,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8786 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346252.183, "dur": 0.220, + "args": { + "External id": 451172,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8787 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346253.116, "dur": 0.212, + "args": { + "External id": 451173,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8788 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346254.068, "dur": 0.224, + "args": { + "External id": 451174,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8789 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346255.006, "dur": 0.217, + "args": { + "External id": 451175,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8790 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346256.043, "dur": 0.228, + "args": { + "External id": 451176,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8791 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346258.684, "dur": 0.217, + "args": { + "External id": 451177,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8792 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346259.692, "dur": 0.217, + "args": { + "External id": 451178,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8793 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346261.032, "dur": 0.239, + "args": { + "External id": 451179,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8794 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346262.165, "dur": 0.230, + "args": { + "External id": 451180,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8795 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346270.420, "dur": 0.233, + "args": { + "External id": 451181,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8796 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346271.419, "dur": 0.223, + "args": { + "External id": 451182,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8797 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346272.402, "dur": 0.218, + "args": { + "External id": 451183,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8798 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346273.339, "dur": 0.216, + "args": { + "External id": 451184,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8799 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346275.496, "dur": 0.223, + "args": { + "External id": 451185,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8800 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346276.511, "dur": 0.210, + "args": { + "External id": 451186,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8801 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346277.542, "dur": 0.216, + "args": { + "External id": 451187,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8802 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346278.496, "dur": 0.221, + "args": { + "External id": 451188,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8803 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346279.441, "dur": 0.218, + "args": { + "External id": 451189,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8804 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346280.369, "dur": 0.227, + "args": { + "External id": 451190,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8805 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346281.345, "dur": 0.215, + "args": { + "External id": 451191,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8806 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346282.311, "dur": 0.220, + "args": { + "External id": 451192,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8807 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346284.692, "dur": 0.230, + "args": { + "External id": 451193,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8808 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346285.796, "dur": 0.245, + "args": { + "External id": 451194,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8809 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346286.808, "dur": 0.221, + "args": { + "External id": 451195,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8810 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008346287.769, "dur": 0.225, + "args": { + "External id": 451196,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 8811 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183441, "tid": 4183441, + "ts": 676008346331.634, "dur": 1131.005, + "args": { + "External id": 451197,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8812 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 4183441, "tid": 4183441, + "ts": 676008346710.889, "dur": 684.957, + "args": { + "External id": 451198,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8813 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346717.670, "dur": 7.651, + "args": { + "External id": 451199,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8814 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346721.871, "dur": 2.836, + "args": { + "External id": 451200,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8815 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346725.932, "dur": 2.848, + "args": { + "External id": 451201,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8816 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346726.621, "dur": 2.068, + "args": { + "External id": 451202,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8817 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346729.143, "dur": 2.761, + "args": { + "External id": 451203,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8818 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346731.073, "dur": 0.756, + "args": { + "External id": 451204,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8819 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346732.149, "dur": 1.446, + "args": { + "External id": 451205,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8820 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346732.619, "dur": 0.788, + "args": { + "External id": 451206,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8821 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346735.116, "dur": 4.428, + "args": { + "External id": 451207,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8822 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346739.090, "dur": 0.385, + "args": { + "External id": 451208,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8823 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346739.845, "dur": 1.250, + "args": { + "External id": 451209,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8824 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346740.244, "dur": 0.785, + "args": { + "External id": 451210,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8825 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346741.342, "dur": 0.946, + "args": { + "External id": 451211,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8826 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346741.730, "dur": 0.490, + "args": { + "External id": 451212,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8827 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346742.515, "dur": 6.319, + "args": { + "External id": 451213,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8828 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346748.094, "dur": 0.653, + "args": { + "External id": 451214,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8829 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346749.088, "dur": 1.249, + "args": { + "External id": 451215,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8830 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346749.597, "dur": 0.674, + "args": { + "External id": 451216,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8831 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346750.568, "dur": 2.833, + "args": { + "External id": 451217,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8832 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346750.928, "dur": 2.403, + "args": { + "External id": 451218,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8833 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346753.648, "dur": 2.575, + "args": { + "External id": 451219,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8834 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346755.333, "dur": 0.821, + "args": { + "External id": 451220,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8835 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346756.654, "dur": 1.625, + "args": { + "External id": 451221,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8836 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346757.030, "dur": 1.180, + "args": { + "External id": 451222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8837 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346759.668, "dur": 4.528, + "args": { + "External id": 451223,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8838 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346763.452, "dur": 0.664, + "args": { + "External id": 451224,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8839 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346764.461, "dur": 1.345, + "args": { + "External id": 451225,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8840 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346765.026, "dur": 0.605, + "args": { + "External id": 451226,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8841 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346766.055, "dur": 1.111, + "args": { + "External id": 451227,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8842 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346766.416, "dur": 0.681, + "args": { + "External id": 451228,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8843 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346767.392, "dur": 3.341, + "args": { + "External id": 451229,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8844 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346770.081, "dur": 0.590, + "args": { + "External id": 451230,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8845 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346770.965, "dur": 1.055, + "args": { + "External id": 451231,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8846 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346771.337, "dur": 0.420, + "args": { + "External id": 451232,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8847 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346772.285, "dur": 2.404, + "args": { + "External id": 451233,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8848 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346772.678, "dur": 1.928, + "args": { + "External id": 451234,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8849 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346774.937, "dur": 2.522, + "args": { + "External id": 451235,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8850 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346776.806, "dur": 0.593, + "args": { + "External id": 451236,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8851 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346777.687, "dur": 1.394, + "args": { + "External id": 451237,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8852 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346778.085, "dur": 0.931, + "args": { + "External id": 451238,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8853 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346780.682, "dur": 4.073, + "args": { + "External id": 451239,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8854 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346784.146, "dur": 0.545, + "args": { + "External id": 451240,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8855 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346785.006, "dur": 1.147, + "args": { + "External id": 451241,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8856 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346785.361, "dur": 0.722, + "args": { + "External id": 451242,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8857 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346786.406, "dur": 1.288, + "args": { + "External id": 451243,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8858 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346786.768, "dur": 0.663, + "args": { + "External id": 451244,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8859 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346787.926, "dur": 2.564, + "args": { + "External id": 451245,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8860 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346789.939, "dur": 0.485, + "args": { + "External id": 451246,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8861 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346790.718, "dur": 1.706, + "args": { + "External id": 451247,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8862 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346791.159, "dur": 1.085, + "args": { + "External id": 451248,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8863 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346792.664, "dur": 2.413, + "args": { + "External id": 451249,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8864 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346793.024, "dur": 1.858, + "args": { + "External id": 451250,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8865 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346795.312, "dur": 2.336, + "args": { + "External id": 451251,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8866 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346796.858, "dur": 0.721, + "args": { + "External id": 451252,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8867 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346797.878, "dur": 1.368, + "args": { + "External id": 451253,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8868 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346798.274, "dur": 0.898, + "args": { + "External id": 451254,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8869 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346800.879, "dur": 4.472, + "args": { + "External id": 451255,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8870 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346804.541, "dur": 0.743, + "args": { + "External id": 451256,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8871 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346805.798, "dur": 1.005, + "args": { + "External id": 451257,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8872 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346806.166, "dur": 0.562, + "args": { + "External id": 451258,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8873 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346807.030, "dur": 1.307, + "args": { + "External id": 451259,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8874 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346807.390, "dur": 0.798, + "args": { + "External id": 451260,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8875 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346808.564, "dur": 4.301, + "args": { + "External id": 451261,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8876 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346812.259, "dur": 0.362, + "args": { + "External id": 451262,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8877 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346813.113, "dur": 1.064, + "args": { + "External id": 451263,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8878 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346813.517, "dur": 0.596, + "args": { + "External id": 451264,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8879 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346814.404, "dur": 2.590, + "args": { + "External id": 451265,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8880 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346814.765, "dur": 2.156, + "args": { + "External id": 451266,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8881 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346817.221, "dur": 2.654, + "args": { + "External id": 451267,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8882 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346819.221, "dur": 0.585, + "args": { + "External id": 451268,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8883 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346820.104, "dur": 1.273, + "args": { + "External id": 451269,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8884 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346820.463, "dur": 0.653, + "args": { + "External id": 451270,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8885 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346822.304, "dur": 4.163, + "args": { + "External id": 451271,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8886 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346826.097, "dur": 0.300, + "args": { + "External id": 451272,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8887 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346826.742, "dur": 1.168, + "args": { + "External id": 451273,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8888 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346827.103, "dur": 0.740, + "args": { + "External id": 451274,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8889 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346828.138, "dur": 1.130, + "args": { + "External id": 451275,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8890 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346828.500, "dur": 0.702, + "args": { + "External id": 451276,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8891 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346829.505, "dur": 3.234, + "args": { + "External id": 451277,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8892 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346832.075, "dur": 0.601, + "args": { + "External id": 451278,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8893 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346832.967, "dur": 1.314, + "args": { + "External id": 451279,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8894 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346833.356, "dur": 0.857, + "args": { + "External id": 451280,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8895 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346834.508, "dur": 2.919, + "args": { + "External id": 451281,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8896 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346835.058, "dur": 2.286, + "args": { + "External id": 451282,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8897 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346837.899, "dur": 1.291, + "args": { + "External id": 451283,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8898 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346838.759, "dur": 0.363, + "args": { + "External id": 451284,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8899 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346839.476, "dur": 1.470, + "args": { + "External id": 451285,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8900 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346839.884, "dur": 0.993, + "args": { + "External id": 451286,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8901 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346841.284, "dur": 3.575, + "args": { + "External id": 451287,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8902 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346843.781, "dur": 1.009, + "args": { + "External id": 451288,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8903 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346845.146, "dur": 1.183, + "args": { + "External id": 451289,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8904 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346845.541, "dur": 0.713, + "args": { + "External id": 451290,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8905 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346846.598, "dur": 1.165, + "args": { + "External id": 451291,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8906 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346846.985, "dur": 0.702, + "args": { + "External id": 451292,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8907 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346848.031, "dur": 2.692, + "args": { + "External id": 451293,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8908 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346850.384, "dur": 0.271, + "args": { + "External id": 451294,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8909 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346851.010, "dur": 0.920, + "args": { + "External id": 451295,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8910 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346851.384, "dur": 0.484, + "args": { + "External id": 451296,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8911 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346852.186, "dur": 2.473, + "args": { + "External id": 451297,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8912 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346852.622, "dur": 1.968, + "args": { + "External id": 451298,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8913 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346854.908, "dur": 2.058, + "args": { + "External id": 451299,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8914 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346855.870, "dur": 0.926, + "args": { + "External id": 451300,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8915 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346857.308, "dur": 0.980, + "args": { + "External id": 451301,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8916 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346857.673, "dur": 0.458, + "args": { + "External id": 451302,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8917 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346858.559, "dur": 3.224, + "args": { + "External id": 451303,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8918 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346861.161, "dur": 0.560, + "args": { + "External id": 451304,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8919 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346862.039, "dur": 1.340, + "args": { + "External id": 451305,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8920 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346862.428, "dur": 0.627, + "args": { + "External id": 451306,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8921 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346863.621, "dur": 1.371, + "args": { + "External id": 451307,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8922 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346863.982, "dur": 0.944, + "args": { + "External id": 451308,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8923 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346865.280, "dur": 3.367, + "args": { + "External id": 451309,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8924 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346867.677, "dur": 0.905, + "args": { + "External id": 451310,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8925 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346868.901, "dur": 1.044, + "args": { + "External id": 451311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8926 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346869.270, "dur": 0.613, + "args": { + "External id": 451312,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8927 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346870.392, "dur": 2.967, + "args": { + "External id": 451313,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8928 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346870.802, "dur": 2.268, + "args": { + "External id": 451314,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8929 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346873.721, "dur": 1.197, + "args": { + "External id": 451315,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8930 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346874.221, "dur": 0.626, + "args": { + "External id": 451316,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8931 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346875.247, "dur": 1.592, + "args": { + "External id": 451317,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8932 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346875.661, "dur": 0.999, + "args": { + "External id": 451318,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8933 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346877.092, "dur": 3.262, + "args": { + "External id": 451319,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8934 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346879.690, "dur": 0.584, + "args": { + "External id": 451320,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8935 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346880.605, "dur": 1.397, + "args": { + "External id": 451321,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8936 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346880.991, "dur": 0.834, + "args": { + "External id": 451322,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8937 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346882.284, "dur": 1.423, + "args": { + "External id": 451323,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8938 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346882.985, "dur": 0.655, + "args": { + "External id": 451324,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8939 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346883.959, "dur": 2.954, + "args": { + "External id": 451325,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8940 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346886.479, "dur": 0.370, + "args": { + "External id": 451326,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8941 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346887.153, "dur": 0.871, + "args": { + "External id": 451327,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8942 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346887.527, "dur": 0.406, + "args": { + "External id": 451328,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8943 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346888.277, "dur": 2.554, + "args": { + "External id": 451329,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8944 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346888.636, "dur": 2.040, + "args": { + "External id": 451330,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8945 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346891.140, "dur": 0.845, + "args": { + "External id": 451331,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8946 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346891.633, "dur": 0.281, + "args": { + "External id": 451332,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8947 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346892.263, "dur": 1.166, + "args": { + "External id": 451333,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8948 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346892.725, "dur": 0.638, + "args": { + "External id": 451334,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8949 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346893.707, "dur": 3.208, + "args": { + "External id": 451335,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8950 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346896.500, "dur": 0.346, + "args": { + "External id": 451336,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8951 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346897.170, "dur": 1.170, + "args": { + "External id": 451337,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8952 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346897.530, "dur": 0.741, + "args": { + "External id": 451338,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8953 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346898.585, "dur": 0.894, + "args": { + "External id": 451339,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8954 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346898.944, "dur": 0.465, + "args": { + "External id": 451340,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8955 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346899.731, "dur": 2.940, + "args": { + "External id": 451341,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8956 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346902.181, "dur": 0.419, + "args": { + "External id": 451342,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8957 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346902.914, "dur": 1.115, + "args": { + "External id": 451343,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8958 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346903.347, "dur": 0.592, + "args": { + "External id": 451344,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8959 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346904.285, "dur": 2.457, + "args": { + "External id": 451345,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8960 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346904.654, "dur": 1.918, + "args": { + "External id": 451346,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8961 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346906.987, "dur": 1.546, + "args": { + "External id": 451347,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8962 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346907.855, "dur": 0.415, + "args": { + "External id": 451348,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8963 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346908.872, "dur": 1.369, + "args": { + "External id": 451349,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8964 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346909.463, "dur": 0.709, + "args": { + "External id": 451350,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8965 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346910.495, "dur": 3.306, + "args": { + "External id": 451351,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8966 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346913.144, "dur": 0.581, + "args": { + "External id": 451352,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8967 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346914.081, "dur": 0.818, + "args": { + "External id": 451353,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8968 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346914.449, "dur": 0.377, + "args": { + "External id": 451354,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8969 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346915.154, "dur": 1.028, + "args": { + "External id": 451355,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8970 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346915.753, "dur": 0.359, + "args": { + "External id": 451356,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8971 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346916.465, "dur": 3.391, + "args": { + "External id": 451357,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8972 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346918.875, "dur": 0.822, + "args": { + "External id": 451358,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8973 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346920.311, "dur": 0.865, + "args": { + "External id": 451359,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8974 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346920.683, "dur": 0.428, + "args": { + "External id": 451360,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8975 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346921.430, "dur": 2.870, + "args": { + "External id": 451361,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8976 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346921.838, "dur": 2.159, + "args": { + "External id": 451362,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8977 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346924.545, "dur": 1.159, + "args": { + "External id": 451363,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8978 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346925.014, "dur": 0.626, + "args": { + "External id": 451364,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8979 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346926.033, "dur": 1.401, + "args": { + "External id": 451365,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8980 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346926.471, "dur": 0.899, + "args": { + "External id": 451366,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8981 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346927.691, "dur": 3.267, + "args": { + "External id": 451367,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8982 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346930.485, "dur": 0.407, + "args": { + "External id": 451368,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8983 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346931.216, "dur": 1.079, + "args": { + "External id": 451369,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8984 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346931.623, "dur": 0.457, + "args": { + "External id": 451370,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8985 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346932.537, "dur": 0.927, + "args": { + "External id": 451371,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8986 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346933.078, "dur": 0.315, + "args": { + "External id": 451372,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8987 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346933.716, "dur": 2.747, + "args": { + "External id": 451373,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8988 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346936.013, "dur": 0.379, + "args": { + "External id": 451374,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8989 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346936.707, "dur": 0.936, + "args": { + "External id": 451375,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8990 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346937.103, "dur": 0.464, + "args": { + "External id": 451376,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8991 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346938.087, "dur": 3.529, + "args": { + "External id": 451377,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8992 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346938.920, "dur": 2.612, + "args": { + "External id": 451378,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8993 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346941.922, "dur": 1.390, + "args": { + "External id": 451379,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8994 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346942.599, "dur": 0.648, + "args": { + "External id": 451380,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8995 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346943.603, "dur": 0.956, + "args": { + "External id": 451381,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8996 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346944.130, "dur": 0.358, + "args": { + "External id": 451382,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8997 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346944.850, "dur": 3.154, + "args": { + "External id": 451383,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 8998 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346947.351, "dur": 0.587, + "args": { + "External id": 451384,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8999 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346948.294, "dur": 2.013, + "args": { + "External id": 451385,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9000 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346948.965, "dur": 1.081, + "args": { + "External id": 451386,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9001 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346950.575, "dur": 1.561, + "args": { + "External id": 451387,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9002 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346951.245, "dur": 0.812, + "args": { + "External id": 451388,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9003 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346952.440, "dur": 3.376, + "args": { + "External id": 451389,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9004 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346955.099, "dur": 0.552, + "args": { + "External id": 451390,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9005 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346956.084, "dur": 1.080, + "args": { + "External id": 451391,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9006 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346956.723, "dur": 0.371, + "args": { + "External id": 451392,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9007 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346957.483, "dur": 2.786, + "args": { + "External id": 451393,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9008 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346957.947, "dur": 2.251, + "args": { + "External id": 451394,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9009 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346960.767, "dur": 1.388, + "args": { + "External id": 451395,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9010 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346961.609, "dur": 0.367, + "args": { + "External id": 451396,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9011 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346962.449, "dur": 1.725, + "args": { + "External id": 451397,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9012 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346963.141, "dur": 0.863, + "args": { + "External id": 451398,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9013 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346964.577, "dur": 3.134, + "args": { + "External id": 451399,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9014 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346967.223, "dur": 0.421, + "args": { + "External id": 451400,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9015 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346968.121, "dur": 0.997, + "args": { + "External id": 451401,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9016 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346968.655, "dur": 0.389, + "args": { + "External id": 451402,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9017 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346969.418, "dur": 1.294, + "args": { + "External id": 451403,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9018 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346969.875, "dur": 0.773, + "args": { + "External id": 451404,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9019 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346970.992, "dur": 2.867, + "args": { + "External id": 451405,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9020 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346973.378, "dur": 0.416, + "args": { + "External id": 451406,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9021 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346974.129, "dur": 1.145, + "args": { + "External id": 451407,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9022 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346974.658, "dur": 0.401, + "args": { + "External id": 451408,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9023 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346975.747, "dur": 3.078, + "args": { + "External id": 451409,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9024 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346976.176, "dur": 2.567, + "args": { + "External id": 451410,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9025 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346979.127, "dur": 1.219, + "args": { + "External id": 451411,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9026 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346979.654, "dur": 0.624, + "args": { + "External id": 451412,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9027 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346980.624, "dur": 1.566, + "args": { + "External id": 451413,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9028 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346981.080, "dur": 1.043, + "args": { + "External id": 451414,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9029 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346982.595, "dur": 2.996, + "args": { + "External id": 451415,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9030 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346984.980, "dur": 0.548, + "args": { + "External id": 451416,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9031 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346985.876, "dur": 1.102, + "args": { + "External id": 451417,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9032 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346986.358, "dur": 0.556, + "args": { + "External id": 451418,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9033 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346987.394, "dur": 1.305, + "args": { + "External id": 451419,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9034 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346988.063, "dur": 0.572, + "args": { + "External id": 451420,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9035 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346988.976, "dur": 2.530, + "args": { + "External id": 451421,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9036 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346990.901, "dur": 0.543, + "args": { + "External id": 451422,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9037 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346991.772, "dur": 1.293, + "args": { + "External id": 451423,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9038 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346992.287, "dur": 0.515, + "args": { + "External id": 451424,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9039 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346993.527, "dur": 2.990, + "args": { + "External id": 451425,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9040 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346993.943, "dur": 2.501, + "args": { + "External id": 451426,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9041 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346996.806, "dur": 1.517, + "args": { + "External id": 451427,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9042 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346997.567, "dur": 0.687, + "args": { + "External id": 451428,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9043 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008346998.620, "dur": 1.702, + "args": { + "External id": 451429,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9044 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008346999.435, "dur": 0.617, + "args": { + "External id": 451430,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9045 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347000.604, "dur": 3.270, + "args": { + "External id": 451431,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9046 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347003.256, "dur": 0.537, + "args": { + "External id": 451432,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9047 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347004.160, "dur": 1.309, + "args": { + "External id": 451433,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9048 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347004.737, "dur": 0.663, + "args": { + "External id": 451434,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9049 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347005.737, "dur": 1.396, + "args": { + "External id": 451435,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9050 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347006.426, "dur": 0.636, + "args": { + "External id": 451436,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9051 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347007.429, "dur": 3.316, + "args": { + "External id": 451437,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9052 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347009.912, "dur": 0.766, + "args": { + "External id": 451438,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9053 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347011.113, "dur": 1.486, + "args": { + "External id": 451439,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9054 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347011.778, "dur": 0.744, + "args": { + "External id": 451440,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9055 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347013.199, "dur": 2.856, + "args": { + "External id": 451441,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9056 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347013.924, "dur": 2.060, + "args": { + "External id": 451442,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9057 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347016.343, "dur": 2.097, + "args": { + "External id": 451443,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9058 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347016.966, "dur": 1.405, + "args": { + "External id": 451444,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9059 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347018.992, "dur": 1.431, + "args": { + "External id": 451445,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9060 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347019.435, "dur": 0.922, + "args": { + "External id": 451446,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9061 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347020.918, "dur": 2.852, + "args": { + "External id": 451447,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9062 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347023.163, "dur": 0.541, + "args": { + "External id": 451448,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9063 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347024.065, "dur": 0.763, + "args": { + "External id": 451449,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9064 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347024.545, "dur": 0.215, + "args": { + "External id": 451450,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9065 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347025.271, "dur": 1.165, + "args": { + "External id": 451451,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9066 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347025.817, "dur": 0.556, + "args": { + "External id": 451452,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9067 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347026.729, "dur": 3.035, + "args": { + "External id": 451453,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9068 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347029.113, "dur": 0.578, + "args": { + "External id": 451454,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9069 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347030.295, "dur": 0.996, + "args": { + "External id": 451455,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9070 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347030.890, "dur": 0.328, + "args": { + "External id": 451456,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9071 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347031.666, "dur": 2.995, + "args": { + "External id": 451457,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9072 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347032.551, "dur": 2.010, + "args": { + "External id": 451458,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9073 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347035.082, "dur": 1.069, + "args": { + "External id": 451459,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9074 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347035.639, "dur": 0.433, + "args": { + "External id": 451460,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9075 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347036.431, "dur": 0.964, + "args": { + "External id": 451461,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9076 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347036.900, "dur": 0.425, + "args": { + "External id": 451462,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9077 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347037.685, "dur": 2.974, + "args": { + "External id": 451463,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9078 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347040.243, "dur": 0.351, + "args": { + "External id": 451464,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9079 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347040.944, "dur": 0.984, + "args": { + "External id": 451465,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9080 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347041.508, "dur": 0.352, + "args": { + "External id": 451466,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9081 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347042.200, "dur": 1.138, + "args": { + "External id": 451467,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9082 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347042.642, "dur": 0.629, + "args": { + "External id": 451468,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9083 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347043.615, "dur": 4.045, + "args": { + "External id": 451469,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9084 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347047.123, "dur": 0.463, + "args": { + "External id": 451470,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9085 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347047.931, "dur": 1.093, + "args": { + "External id": 451471,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9086 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347048.430, "dur": 0.529, + "args": { + "External id": 451472,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9087 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347049.436, "dur": 2.861, + "args": { + "External id": 451473,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9088 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347050.143, "dur": 1.992, + "args": { + "External id": 451474,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9089 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347052.587, "dur": 1.501, + "args": { + "External id": 451475,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9090 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347053.029, "dur": 0.995, + "args": { + "External id": 451476,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9091 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347054.584, "dur": 1.159, + "args": { + "External id": 451477,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9092 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347055.004, "dur": 0.672, + "args": { + "External id": 451478,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9093 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347056.166, "dur": 3.117, + "args": { + "External id": 451479,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9094 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347058.694, "dur": 0.522, + "args": { + "External id": 451480,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9095 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347059.645, "dur": 1.219, + "args": { + "External id": 451481,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9096 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347060.150, "dur": 0.648, + "args": { + "External id": 451482,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9097 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347061.149, "dur": 1.091, + "args": { + "External id": 451483,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9098 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347061.626, "dur": 0.547, + "args": { + "External id": 451484,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9099 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347062.517, "dur": 3.259, + "args": { + "External id": 451485,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9100 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347065.230, "dur": 0.480, + "args": { + "External id": 451486,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9101 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347066.289, "dur": 1.173, + "args": { + "External id": 451487,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9102 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347067.091, "dur": 0.306, + "args": { + "External id": 451488,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9103 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347067.730, "dur": 2.530, + "args": { + "External id": 451489,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9104 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347068.229, "dur": 1.781, + "args": { + "External id": 451490,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9105 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347070.533, "dur": 1.113, + "args": { + "External id": 451491,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9106 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347071.063, "dur": 0.516, + "args": { + "External id": 451492,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9107 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347072.034, "dur": 1.139, + "args": { + "External id": 451493,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9108 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347072.694, "dur": 0.413, + "args": { + "External id": 451494,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9109 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347073.452, "dur": 3.469, + "args": { + "External id": 451495,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9110 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347076.088, "dur": 0.765, + "args": { + "External id": 451496,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9111 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347077.233, "dur": 0.979, + "args": { + "External id": 451497,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9112 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347077.723, "dur": 0.425, + "args": { + "External id": 451498,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9113 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347078.479, "dur": 0.907, + "args": { + "External id": 451499,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9114 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347079.013, "dur": 0.305, + "args": { + "External id": 451500,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9115 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347079.852, "dur": 16.836, + "args": { + "External id": 451501,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9116 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347095.183, "dur": 0.900, + "args": { + "External id": 451502,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9117 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347097.185, "dur": 1.378, + "args": { + "External id": 451503,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9118 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347097.912, "dur": 0.582, + "args": { + "External id": 451504,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9119 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347098.835, "dur": 2.699, + "args": { + "External id": 451505,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9120 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347099.340, "dur": 2.117, + "args": { + "External id": 451506,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9121 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347101.806, "dur": 1.155, + "args": { + "External id": 451507,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9122 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347102.348, "dur": 0.542, + "args": { + "External id": 451508,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9123 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347103.248, "dur": 1.496, + "args": { + "External id": 451509,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9124 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347103.702, "dur": 0.970, + "args": { + "External id": 451510,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9125 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347105.210, "dur": 3.002, + "args": { + "External id": 451511,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9126 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347107.703, "dur": 0.438, + "args": { + "External id": 451512,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9127 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347108.499, "dur": 1.143, + "args": { + "External id": 451513,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9128 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347108.970, "dur": 0.608, + "args": { + "External id": 451514,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9129 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347110.114, "dur": 1.113, + "args": { + "External id": 451515,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9130 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347110.750, "dur": 0.409, + "args": { + "External id": 451516,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9131 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347111.606, "dur": 3.446, + "args": { + "External id": 451517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9132 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347114.287, "dur": 0.690, + "args": { + "External id": 451518,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9133 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347115.321, "dur": 1.115, + "args": { + "External id": 451519,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9134 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347115.988, "dur": 0.375, + "args": { + "External id": 451520,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9135 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347116.706, "dur": 2.739, + "args": { + "External id": 451521,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9136 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347117.513, "dur": 1.855, + "args": { + "External id": 451522,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9137 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347119.712, "dur": 1.024, + "args": { + "External id": 451523,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9138 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347120.200, "dur": 0.468, + "args": { + "External id": 451524,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9139 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347121.142, "dur": 1.001, + "args": { + "External id": 451525,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9140 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347121.591, "dur": 0.482, + "args": { + "External id": 451526,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9141 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347122.406, "dur": 3.011, + "args": { + "External id": 451527,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9142 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347125.014, "dur": 0.332, + "args": { + "External id": 451528,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9143 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347125.703, "dur": 0.958, + "args": { + "External id": 451529,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9144 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347126.213, "dur": 0.378, + "args": { + "External id": 451530,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9145 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347126.964, "dur": 1.397, + "args": { + "External id": 451531,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9146 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347127.622, "dur": 0.671, + "args": { + "External id": 451532,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9147 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347128.623, "dur": 3.041, + "args": { + "External id": 451533,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9148 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347130.848, "dur": 0.750, + "args": { + "External id": 451534,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9149 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347131.926, "dur": 1.079, + "args": { + "External id": 451535,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9150 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347132.483, "dur": 0.450, + "args": { + "External id": 451536,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9151 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347133.279, "dur": 2.855, + "args": { + "External id": 451537,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9152 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347133.782, "dur": 2.186, + "args": { + "External id": 451538,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9153 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347136.514, "dur": 0.828, + "args": { + "External id": 451539,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9154 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347137.045, "dur": 0.227, + "args": { + "External id": 451540,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9155 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347137.615, "dur": 0.938, + "args": { + "External id": 451541,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9156 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347138.107, "dur": 0.376, + "args": { + "External id": 451542,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9157 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347138.939, "dur": 3.089, + "args": { + "External id": 451543,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9158 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347141.412, "dur": 0.546, + "args": { + "External id": 451544,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9159 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347142.437, "dur": 1.243, + "args": { + "External id": 451545,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9160 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347142.945, "dur": 0.665, + "args": { + "External id": 451546,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9161 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347144.054, "dur": 1.394, + "args": { + "External id": 451547,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9162 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347144.992, "dur": 0.383, + "args": { + "External id": 451548,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9163 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347145.912, "dur": 3.113, + "args": { + "External id": 451549,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9164 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347148.590, "dur": 0.362, + "args": { + "External id": 451550,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9165 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347149.310, "dur": 0.844, + "args": { + "External id": 451551,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9166 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347149.751, "dur": 0.323, + "args": { + "External id": 451552,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9167 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347150.415, "dur": 2.523, + "args": { + "External id": 451553,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9168 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347150.871, "dur": 1.994, + "args": { + "External id": 451554,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9169 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347153.310, "dur": 0.887, + "args": { + "External id": 451555,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9170 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347153.790, "dur": 0.336, + "args": { + "External id": 451556,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9171 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347154.455, "dur": 1.166, + "args": { + "External id": 451557,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9172 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347154.962, "dur": 0.588, + "args": { + "External id": 451558,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9173 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347155.884, "dur": 2.807, + "args": { + "External id": 451559,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9174 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347158.357, "dur": 0.261, + "args": { + "External id": 451560,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9175 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347158.984, "dur": 0.970, + "args": { + "External id": 451561,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9176 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347159.553, "dur": 0.333, + "args": { + "External id": 451562,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9177 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347160.215, "dur": 1.099, + "args": { + "External id": 451563,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9178 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347160.739, "dur": 0.506, + "args": { + "External id": 451564,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9179 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347161.697, "dur": 3.111, + "args": { + "External id": 451565,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9180 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347164.287, "dur": 0.450, + "args": { + "External id": 451566,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9181 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347165.409, "dur": 1.341, + "args": { + "External id": 451567,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9182 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347166.118, "dur": 0.565, + "args": { + "External id": 451568,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9183 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347167.010, "dur": 2.641, + "args": { + "External id": 451569,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9184 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347167.489, "dur": 2.088, + "args": { + "External id": 451570,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9185 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347169.916, "dur": 0.834, + "args": { + "External id": 451571,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9186 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347170.453, "dur": 0.225, + "args": { + "External id": 451572,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9187 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347171.017, "dur": 1.149, + "args": { + "External id": 451573,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9188 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347171.517, "dur": 0.578, + "args": { + "External id": 451574,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9189 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347172.474, "dur": 3.683, + "args": { + "External id": 451575,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9190 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347175.462, "dur": 0.620, + "args": { + "External id": 451576,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9191 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347176.618, "dur": 0.900, + "args": { + "External id": 451577,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9192 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347177.110, "dur": 0.339, + "args": { + "External id": 451578,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9193 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347177.782, "dur": 1.502, + "args": { + "External id": 451579,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9194 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347178.640, "dur": 0.574, + "args": { + "External id": 451580,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9195 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347179.549, "dur": 2.869, + "args": { + "External id": 451581,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9196 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347181.917, "dur": 0.426, + "args": { + "External id": 451582,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9197 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347182.676, "dur": 1.002, + "args": { + "External id": 451583,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9198 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347183.262, "dur": 0.338, + "args": { + "External id": 451584,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9199 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347204.498, "dur": 2.784, + "args": { + "External id": 451585,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9200 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347205.227, "dur": 1.981, + "args": { + "External id": 451586,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9201 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347207.588, "dur": 1.226, + "args": { + "External id": 451587,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9202 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347208.188, "dur": 0.548, + "args": { + "External id": 451588,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9203 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347209.071, "dur": 1.121, + "args": { + "External id": 451589,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9204 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347209.569, "dur": 0.551, + "args": { + "External id": 451590,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9205 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347210.450, "dur": 2.841, + "args": { + "External id": 451591,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9206 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347212.953, "dur": 0.265, + "args": { + "External id": 451592,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9207 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347213.588, "dur": 1.006, + "args": { + "External id": 451593,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9208 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347214.118, "dur": 0.402, + "args": { + "External id": 451594,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9209 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347214.853, "dur": 0.972, + "args": { + "External id": 451595,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9210 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347215.314, "dur": 0.442, + "args": { + "External id": 451596,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9211 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347216.082, "dur": 2.667, + "args": { + "External id": 451597,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9212 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347218.213, "dur": 0.469, + "args": { + "External id": 451598,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9213 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347219.014, "dur": 0.840, + "args": { + "External id": 451599,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9214 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347219.472, "dur": 0.309, + "args": { + "External id": 451600,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9215 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347220.109, "dur": 2.934, + "args": { + "External id": 451601,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9216 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347220.586, "dur": 2.379, + "args": { + "External id": 451602,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9217 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347223.314, "dur": 1.320, + "args": { + "External id": 451603,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9218 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347223.949, "dur": 0.625, + "args": { + "External id": 451604,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9219 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347225.102, "dur": 1.074, + "args": { + "External id": 451605,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9220 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347225.599, "dur": 0.506, + "args": { + "External id": 451606,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9221 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347226.444, "dur": 2.610, + "args": { + "External id": 451607,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9222 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347228.618, "dur": 0.363, + "args": { + "External id": 451608,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9223 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347229.348, "dur": 1.130, + "args": { + "External id": 451609,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9224 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347229.938, "dur": 0.461, + "args": { + "External id": 451610,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9225 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347230.746, "dur": 6.553, + "args": { + "External id": 451611,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9226 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347235.147, "dur": 1.865, + "args": { + "External id": 451612,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9227 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347237.576, "dur": 0.917, + "args": { + "External id": 451613,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9228 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347238.092, "dur": 0.335, + "args": { + "External id": 451614,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9229 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347239.002, "dur": 1.103, + "args": { + "External id": 451615,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9230 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347239.492, "dur": 0.543, + "args": { + "External id": 451616,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9231 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347240.676, "dur": 3.051, + "args": { + "External id": 451617,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9232 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347243.096, "dur": 0.560, + "args": { + "External id": 451618,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9233 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347244.207, "dur": 1.074, + "args": { + "External id": 451619,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9234 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347244.779, "dur": 0.437, + "args": { + "External id": 451620,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9235 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347245.892, "dur": 1.405, + "args": { + "External id": 451621,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9236 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347246.418, "dur": 0.812, + "args": { + "External id": 451622,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9237 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347247.747, "dur": 3.016, + "args": { + "External id": 451623,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9238 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347250.103, "dur": 0.594, + "args": { + "External id": 451624,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9239 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347251.037, "dur": 0.925, + "args": { + "External id": 451625,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9240 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347251.455, "dur": 0.444, + "args": { + "External id": 451626,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9241 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347252.343, "dur": 2.739, + "args": { + "External id": 451627,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9242 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347252.767, "dur": 2.054, + "args": { + "External id": 451628,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9243 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347255.372, "dur": 1.256, + "args": { + "External id": 451629,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9244 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347256.047, "dur": 0.518, + "args": { + "External id": 451630,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9245 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347256.901, "dur": 1.338, + "args": { + "External id": 451631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9246 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347257.795, "dur": 0.377, + "args": { + "External id": 451632,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9247 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347258.520, "dur": 2.567, + "args": { + "External id": 451633,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9248 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347260.616, "dur": 0.402, + "args": { + "External id": 451634,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9249 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 4183441, "tid": 4183441, + "ts": 676008347261.720, "dur": 0.882, + "args": { + "External id": 451635,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9250 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347262.145, "dur": 0.393, + "args": { + "External id": 451636,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9251 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 4183441, "tid": 4183441, + "ts": 676008347283.700, "dur": 103.455, + "args": { + "External id": 451637,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9252 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 4183441, "tid": 4183441, + "ts": 676008347474.323, "dur": 124.682, + "args": { + "External id": 451638,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[219], [], [], [], []], "Ev Idx": 9253 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 4183441, "tid": 4183441, + "ts": 676008347533.589, "dur": 46.778, + "args": { + "External id": 451639,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[219], [], [], [], []], "Ev Idx": 9254 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 4183441, "tid": 4183441, + "ts": 676008347546.271, "dur": 0.881, + "args": { + "External id": 451640,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9255 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "Redistribute", "pid": 4183441, "tid": 4183441, + "ts": 676008347941.856, "dur": 941.349, + "args": { + "External id": 451641,"Sequence number": 5285608, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "False"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9256 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183441, "tid": 4183441, + "ts": 676008347992.489, "dur": 52.639, + "args": { + "External id": 451642,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9257 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008347997.986, "dur": 1.429, + "args": { + "External id": 451643,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9258 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008348001.407, "dur": 0.640, + "args": { + "External id": 451644,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9259 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::all_reduce", "pid": 4183441, "tid": 4183441, + "ts": 676008348071.797, "dur": 454.107, + "args": { + "External id": 451645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["float", "", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9260 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 4183441, "tid": 4183441, + "ts": 676008348076.445, "dur": 63.888, + "args": { + "External id": 451646,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9261 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 4183441, "tid": 4183441, + "ts": 676008348079.771, "dur": 25.224, + "args": { + "External id": 451647,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "0"], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9262 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676008348098.673, "dur": 5.394, + "args": { + "External id": 451648,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9263 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 4183441, "tid": 4183441, + "ts": 676008348106.687, "dur": 33.012, + "args": { + "External id": 451649,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9264 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "c10d::allreduce_", "pid": 4183441, "tid": 4183441, + "ts": 676008348150.562, "dur": 371.573, + "args": { + "External id": 451650,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "-1"], "Input type": ["TensorList", "", "", "", "Scalar"], "Input Strides": [[[]], [], [], [], []], "Input Dims": [[[]], [], [], [], []], "Ev Idx": 9265 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676008348177.191, "dur": 338.397, + "args": { + "External id": 451651,"Record function id": 0, "Collective name": "allreduce", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 5, "Input Strides": [[[]], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "5", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1, "Process Group Name": "0", "Input type": ["TensorList", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[[]], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 9266, "In msg nelems": 1 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "nccl:all_reduce", "pid": 4183441, "tid": 4183441, + "ts": 676008348195.151, "dur": 314.810, + "args": { + "External id": 451652,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9267 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183441, "tid": 4183441, + "ts": 676008348592.748, "dur": 252.647, + "args": { + "External id": 451653,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9268 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::wait_tensor", "pid": 4183441, "tid": 4183441, + "ts": 676008348724.274, "dur": 33.112, + "args": { + "External id": 451654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9269 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 4183441, "tid": 4183441, + "ts": 676008348742.405, "dur": 5.898, + "args": { + "External id": 451655,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "5", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 9270, "In msg nelems": 0, "Rank": 5, "In split size": "[]", "Out split size": "[]" + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 4183441, "tid": 4183441, + "ts": 676008348789.686, "dur": 49.840, + "args": { + "External id": 451656,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9271 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008348792.300, "dur": 1.044, + "args": { + "External id": 451657,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9272 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008348794.873, "dur": 0.594, + "args": { + "External id": 451658,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9273 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "_ToTorchTensor", "pid": 4183441, "tid": 4183441, + "ts": 676008348899.663, "dur": 34.946, + "args": { + "External id": 451659,"Sequence number": 5285609, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9274 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 4183441, "tid": 4183441, + "ts": 676008348911.542, "dur": 16.287, + "args": { + "External id": 451660,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9275 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 4183441, "tid": 4183441, + "ts": 676008348914.418, "dur": 12.244, + "args": { + "External id": 451661,"Record function id": 0, "Concrete Inputs": ["", "[]"], "Input type": ["float", "ScalarList"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9276 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 4183441, "tid": 4183441, + "ts": 676008349337.316, "dur": 41.927, + "args": { + "External id": 451662,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "double", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9277 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::reciprocal", "pid": 4183441, "tid": 4183441, + "ts": 676008349394.450, "dur": 24.924, + "args": { + "External id": 451663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9278 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::mul", "pid": 4183441, "tid": 4183441, + "ts": 676008349428.935, "dur": 24.747, + "args": { + "External id": 451664,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "double"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9279 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::clamp", "pid": 4183441, "tid": 4183441, + "ts": 676008349466.392, "dur": 23.680, + "args": { + "External id": 451665,"Record function id": 0, "Concrete Inputs": ["", "", "1."], "Input type": ["float", "", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 9280 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008349470.145, "dur": 0.443, + "args": { + "External id": 451666,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9281 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 4183441, "tid": 4183441, + "ts": 676008349507.838, "dur": 0.410, + "args": { + "External id": 451667,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 9282 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 4183441, "tid": 4183441, + "ts": 676008349600.329, "dur": 542.412, + "args": { + "External id": 451668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9283 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 4183441, "tid": 4183441, + "ts": 676008350042.026, "dur": 73.792, + "args": { + "External id": 451669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9284 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::isnan", "pid": 4183441, "tid": 4183441, + "ts": 676008350180.966, "dur": 27.832, + "args": { + "External id": 451670,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9285 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 4183441, "tid": 4183441, + "ts": 676008350184.757, "dur": 23.464, + "args": { + "External id": 451671,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9286 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 4183441, + "ts": 676008350213.796, "dur": 1123.305, + "args": { + "External id": 451672,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9287 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676008350215.355, "dur": 1121.505, + "args": { + "External id": 451673,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9288 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676008350217.344, "dur": 1118.681, + "args": { + "External id": 451674,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9289 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::isinf", "pid": 4183441, "tid": 4183441, + "ts": 676008351343.566, "dur": 60.218, + "args": { + "External id": 451675,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9290 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676008351346.547, "dur": 34.673, + "args": { + "External id": 451676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9291 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 4183441, "tid": 4183441, + "ts": 676008351353.136, "dur": 3.675, + "args": { + "External id": 451677,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9292 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 4183441, "tid": 4183441, + "ts": 676008351358.573, "dur": 22.289, + "args": { + "External id": 451678,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], [1]], "Input Dims": [[], [0]], "Ev Idx": 9293 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 4183441, "tid": 4183441, + "ts": 676008351363.568, "dur": 2.748, + "args": { + "External id": 451679,"Record function id": 0, "Concrete Inputs": ["", "[]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9294 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 4183441, "tid": 4183441, + "ts": 676008351382.904, "dur": 20.047, + "args": { + "External id": 451680,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9295 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 4183441, "tid": 4183441, + "ts": 676008351406.062, "dur": 38.051, + "args": { + "External id": 451681,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9296 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 4183441, "tid": 4183441, + "ts": 676008351407.168, "dur": 36.766, + "args": { + "External id": 451682,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9297 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 4183441, "tid": 4183441, + "ts": 676008351407.975, "dur": 35.647, + "args": { + "External id": 451683,"Sequence number": 5285610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9298 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#OptimizersContainer.step", "pid": 4183441, "tid": 4183441, + "ts": 676008351475.657, "dur": 4442.256, + "args": { + "External id": 451684,"Record function id": 0, "Ev Idx": 9299 + } + }, + { + "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#AdamW.step", "pid": 4183441, "tid": 4183441, + "ts": 676008351509.624, "dur": 4386.532, + "args": { + "External id": 451685,"Record function id": 0, "Ev Idx": 9300 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_add_", "pid": 4183441, "tid": 4183441, + "ts": 676008352510.239, "dur": 216.407, + "args": { + "External id": 451686,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9301 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352527.142, "dur": 1.091, + "args": { + "External id": 451687,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9302 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352529.317, "dur": 0.275, + "args": { + "External id": 451688,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9303 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352530.099, "dur": 0.211, + "args": { + "External id": 451689,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9304 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352530.790, "dur": 0.066, + "args": { + "External id": 451690,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9305 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352531.298, "dur": 0.065, + "args": { + "External id": 451691,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9306 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352531.854, "dur": 0.065, + "args": { + "External id": 451692,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9307 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352532.351, "dur": 0.053, + "args": { + "External id": 451693,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9308 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352532.843, "dur": 0.090, + "args": { + "External id": 451694,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9309 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352533.444, "dur": 0.068, + "args": { + "External id": 451695,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9310 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352533.916, "dur": 0.085, + "args": { + "External id": 451696,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9311 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352534.415, "dur": 0.066, + "args": { + "External id": 451697,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9312 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352534.828, "dur": 0.278, + "args": { + "External id": 451698,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9313 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352535.374, "dur": 0.067, + "args": { + "External id": 451699,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9314 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352535.850, "dur": 0.056, + "args": { + "External id": 451700,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9315 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352536.215, "dur": 0.067, + "args": { + "External id": 451701,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9316 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352536.635, "dur": 0.067, + "args": { + "External id": 451702,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9317 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352537.075, "dur": 0.066, + "args": { + "External id": 451703,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9318 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352537.515, "dur": 0.064, + "args": { + "External id": 451704,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9319 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352537.961, "dur": 0.067, + "args": { + "External id": 451705,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9320 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352538.356, "dur": 0.082, + "args": { + "External id": 451706,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9321 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352538.874, "dur": 0.067, + "args": { + "External id": 451707,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9322 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352539.404, "dur": 0.064, + "args": { + "External id": 451708,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9323 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352539.836, "dur": 0.065, + "args": { + "External id": 451709,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9324 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352540.201, "dur": 0.065, + "args": { + "External id": 451710,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9325 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352540.552, "dur": 0.063, + "args": { + "External id": 451711,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9326 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352541.005, "dur": 0.063, + "args": { + "External id": 451712,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9327 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352541.743, "dur": 0.060, + "args": { + "External id": 451713,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9328 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352542.141, "dur": 0.066, + "args": { + "External id": 451714,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9329 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352542.566, "dur": 0.061, + "args": { + "External id": 451715,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9330 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352543.231, "dur": 0.064, + "args": { + "External id": 451716,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9331 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352543.665, "dur": 0.062, + "args": { + "External id": 451717,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9332 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352544.109, "dur": 0.063, + "args": { + "External id": 451718,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9333 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352544.592, "dur": 0.062, + "args": { + "External id": 451719,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9334 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352545.025, "dur": 0.067, + "args": { + "External id": 451720,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9335 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352545.408, "dur": 0.064, + "args": { + "External id": 451721,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9336 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352546.106, "dur": 0.068, + "args": { + "External id": 451722,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9337 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352546.712, "dur": 0.069, + "args": { + "External id": 451723,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9338 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352547.121, "dur": 0.067, + "args": { + "External id": 451724,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9339 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352547.581, "dur": 0.070, + "args": { + "External id": 451725,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9340 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352548.006, "dur": 0.066, + "args": { + "External id": 451726,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9341 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352548.396, "dur": 0.070, + "args": { + "External id": 451727,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9342 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352548.840, "dur": 0.245, + "args": { + "External id": 451728,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9343 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352549.575, "dur": 0.050, + "args": { + "External id": 451729,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9344 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352550.052, "dur": 0.063, + "args": { + "External id": 451730,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9345 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352550.515, "dur": 0.066, + "args": { + "External id": 451731,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9346 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352550.943, "dur": 0.069, + "args": { + "External id": 451732,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9347 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352551.368, "dur": 0.282, + "args": { + "External id": 451733,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9348 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352552.257, "dur": 0.092, + "args": { + "External id": 451734,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9349 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352552.749, "dur": 0.276, + "args": { + "External id": 451735,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9350 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352553.611, "dur": 0.091, + "args": { + "External id": 451736,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9351 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352554.181, "dur": 0.067, + "args": { + "External id": 451737,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9352 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352554.599, "dur": 0.068, + "args": { + "External id": 451738,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9353 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352555.062, "dur": 0.069, + "args": { + "External id": 451739,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9354 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352555.490, "dur": 0.082, + "args": { + "External id": 451740,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9355 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352555.925, "dur": 0.069, + "args": { + "External id": 451741,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9356 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352556.339, "dur": 0.066, + "args": { + "External id": 451742,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9357 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352556.762, "dur": 0.067, + "args": { + "External id": 451743,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9358 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352557.307, "dur": 0.067, + "args": { + "External id": 451744,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9359 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352557.838, "dur": 0.057, + "args": { + "External id": 451745,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9360 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352558.354, "dur": 0.067, + "args": { + "External id": 451746,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9361 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352558.741, "dur": 0.067, + "args": { + "External id": 451747,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9362 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352559.167, "dur": 0.064, + "args": { + "External id": 451748,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9363 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352559.602, "dur": 0.070, + "args": { + "External id": 451749,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9364 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352560.061, "dur": 0.066, + "args": { + "External id": 451750,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9365 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352560.463, "dur": 0.071, + "args": { + "External id": 451751,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9366 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352560.950, "dur": 0.054, + "args": { + "External id": 451752,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9367 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352561.362, "dur": 0.066, + "args": { + "External id": 451753,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9368 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352561.774, "dur": 0.052, + "args": { + "External id": 451754,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9369 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352562.165, "dur": 0.069, + "args": { + "External id": 451755,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9370 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352562.678, "dur": 0.067, + "args": { + "External id": 451756,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9371 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352563.005, "dur": 0.264, + "args": { + "External id": 451757,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9372 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352563.768, "dur": 0.084, + "args": { + "External id": 451758,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9373 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352564.165, "dur": 0.090, + "args": { + "External id": 451759,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9374 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352564.718, "dur": 0.263, + "args": { + "External id": 451760,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9375 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352565.340, "dur": 0.066, + "args": { + "External id": 451761,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9376 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352565.775, "dur": 0.083, + "args": { + "External id": 451762,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9377 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352566.220, "dur": 0.066, + "args": { + "External id": 451763,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9378 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352566.674, "dur": 0.255, + "args": { + "External id": 451764,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9379 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352567.315, "dur": 0.294, + "args": { + "External id": 451765,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9380 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352567.952, "dur": 0.269, + "args": { + "External id": 451766,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9381 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352568.761, "dur": 0.093, + "args": { + "External id": 451767,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9382 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352569.242, "dur": 0.069, + "args": { + "External id": 451768,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9383 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352569.656, "dur": 0.069, + "args": { + "External id": 451769,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9384 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352570.098, "dur": 0.066, + "args": { + "External id": 451770,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9385 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352570.549, "dur": 0.095, + "args": { + "External id": 451771,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9386 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352570.938, "dur": 0.067, + "args": { + "External id": 451772,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9387 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352571.313, "dur": 0.069, + "args": { + "External id": 451773,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9388 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352571.742, "dur": 0.065, + "args": { + "External id": 451774,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9389 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352572.213, "dur": 0.072, + "args": { + "External id": 451775,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9390 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352572.599, "dur": 0.073, + "args": { + "External id": 451776,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9391 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352572.970, "dur": 0.064, + "args": { + "External id": 451777,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9392 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352573.393, "dur": 0.071, + "args": { + "External id": 451778,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9393 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352573.830, "dur": 0.059, + "args": { + "External id": 451779,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9394 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352574.238, "dur": 0.064, + "args": { + "External id": 451780,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9395 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352574.633, "dur": 0.073, + "args": { + "External id": 451781,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9396 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352575.138, "dur": 0.075, + "args": { + "External id": 451782,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9397 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352575.577, "dur": 0.065, + "args": { + "External id": 451783,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9398 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352576.018, "dur": 0.069, + "args": { + "External id": 451784,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9399 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352576.502, "dur": 0.063, + "args": { + "External id": 451785,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9400 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352576.888, "dur": 0.070, + "args": { + "External id": 451786,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9401 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352577.260, "dur": 0.066, + "args": { + "External id": 451787,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9402 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352578.222, "dur": 0.070, + "args": { + "External id": 451788,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9403 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352578.578, "dur": 0.064, + "args": { + "External id": 451789,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9404 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352579.292, "dur": 0.067, + "args": { + "External id": 451790,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9405 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352579.723, "dur": 0.068, + "args": { + "External id": 451791,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9406 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352580.188, "dur": 0.065, + "args": { + "External id": 451792,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9407 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352580.605, "dur": 0.063, + "args": { + "External id": 451793,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9408 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352581.222, "dur": 0.249, + "args": { + "External id": 451794,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9409 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352581.998, "dur": 0.067, + "args": { + "External id": 451795,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9410 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352582.436, "dur": 0.270, + "args": { + "External id": 451796,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9411 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352583.179, "dur": 0.073, + "args": { + "External id": 451797,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9412 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352583.831, "dur": 0.084, + "args": { + "External id": 451798,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9413 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352584.247, "dur": 0.086, + "args": { + "External id": 451799,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9414 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352584.791, "dur": 0.267, + "args": { + "External id": 451800,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9415 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352585.445, "dur": 0.066, + "args": { + "External id": 451801,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9416 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352585.962, "dur": 0.064, + "args": { + "External id": 451802,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9417 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352586.379, "dur": 0.069, + "args": { + "External id": 451803,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9418 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352586.755, "dur": 0.072, + "args": { + "External id": 451804,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9419 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352587.173, "dur": 0.102, + "args": { + "External id": 451805,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9420 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352587.656, "dur": 0.286, + "args": { + "External id": 451806,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9421 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352588.336, "dur": 0.104, + "args": { + "External id": 451807,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9422 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352588.720, "dur": 0.110, + "args": { + "External id": 451808,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9423 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352589.112, "dur": 0.064, + "args": { + "External id": 451809,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9424 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352589.692, "dur": 0.068, + "args": { + "External id": 451810,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9425 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352590.132, "dur": 0.067, + "args": { + "External id": 451811,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9426 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352590.515, "dur": 0.091, + "args": { + "External id": 451812,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9427 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352590.981, "dur": 0.066, + "args": { + "External id": 451813,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9428 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352591.395, "dur": 0.067, + "args": { + "External id": 451814,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9429 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352591.757, "dur": 0.061, + "args": { + "External id": 451815,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9430 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352592.279, "dur": 0.063, + "args": { + "External id": 451816,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9431 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352592.802, "dur": 0.067, + "args": { + "External id": 451817,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9432 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352593.205, "dur": 0.063, + "args": { + "External id": 451818,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9433 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352593.684, "dur": 0.068, + "args": { + "External id": 451819,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9434 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352594.067, "dur": 0.069, + "args": { + "External id": 451820,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9435 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352594.403, "dur": 0.067, + "args": { + "External id": 451821,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9436 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352594.858, "dur": 0.067, + "args": { + "External id": 451822,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9437 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352595.249, "dur": 0.067, + "args": { + "External id": 451823,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9438 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352595.654, "dur": 0.067, + "args": { + "External id": 451824,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9439 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352596.299, "dur": 0.066, + "args": { + "External id": 451825,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9440 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352596.676, "dur": 0.069, + "args": { + "External id": 451826,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9441 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352597.180, "dur": 0.070, + "args": { + "External id": 451827,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9442 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352597.718, "dur": 0.067, + "args": { + "External id": 451828,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9443 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352598.069, "dur": 0.069, + "args": { + "External id": 451829,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9444 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352598.434, "dur": 0.066, + "args": { + "External id": 451830,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9445 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352598.760, "dur": 0.055, + "args": { + "External id": 451831,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9446 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352599.083, "dur": 0.050, + "args": { + "External id": 451832,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9447 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352599.745, "dur": 0.068, + "args": { + "External id": 451833,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9448 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352600.119, "dur": 0.052, + "args": { + "External id": 451834,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9449 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352600.761, "dur": 0.066, + "args": { + "External id": 451835,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9450 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352601.325, "dur": 0.053, + "args": { + "External id": 451836,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9451 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352602.045, "dur": 0.062, + "args": { + "External id": 451837,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9452 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352602.385, "dur": 0.064, + "args": { + "External id": 451838,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9453 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352602.867, "dur": 0.065, + "args": { + "External id": 451839,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9454 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352603.398, "dur": 0.060, + "args": { + "External id": 451840,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9455 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352603.951, "dur": 0.067, + "args": { + "External id": 451841,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9456 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352604.272, "dur": 0.064, + "args": { + "External id": 451842,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9457 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352604.880, "dur": 0.061, + "args": { + "External id": 451843,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9458 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352605.196, "dur": 0.062, + "args": { + "External id": 451844,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9459 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352605.727, "dur": 0.069, + "args": { + "External id": 451845,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9460 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352606.094, "dur": 0.053, + "args": { + "External id": 451846,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9461 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352606.620, "dur": 0.065, + "args": { + "External id": 451847,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9462 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352606.961, "dur": 0.050, + "args": { + "External id": 451848,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9463 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352607.536, "dur": 0.057, + "args": { + "External id": 451849,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9464 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352607.838, "dur": 0.052, + "args": { + "External id": 451850,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9465 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352608.304, "dur": 0.066, + "args": { + "External id": 451851,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9466 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352608.612, "dur": 0.052, + "args": { + "External id": 451852,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9467 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352609.202, "dur": 0.064, + "args": { + "External id": 451853,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9468 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352609.518, "dur": 0.052, + "args": { + "External id": 451854,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9469 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352610.017, "dur": 0.061, + "args": { + "External id": 451855,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9470 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352610.331, "dur": 0.049, + "args": { + "External id": 451856,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9471 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352611.112, "dur": 0.066, + "args": { + "External id": 451857,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9472 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352611.431, "dur": 0.047, + "args": { + "External id": 451858,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9473 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352612.151, "dur": 0.058, + "args": { + "External id": 451859,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9474 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352612.460, "dur": 0.048, + "args": { + "External id": 451860,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9475 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352612.958, "dur": 0.059, + "args": { + "External id": 451861,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9476 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352613.264, "dur": 0.045, + "args": { + "External id": 451862,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9477 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352613.784, "dur": 0.058, + "args": { + "External id": 451863,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9478 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352614.090, "dur": 0.046, + "args": { + "External id": 451864,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9479 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352614.764, "dur": 0.059, + "args": { + "External id": 451865,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9480 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352615.065, "dur": 0.044, + "args": { + "External id": 451866,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9481 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352615.953, "dur": 0.068, + "args": { + "External id": 451867,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9482 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352616.318, "dur": 0.066, + "args": { + "External id": 451868,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9483 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352617.192, "dur": 0.052, + "args": { + "External id": 451869,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9484 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352617.493, "dur": 0.052, + "args": { + "External id": 451870,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9485 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352618.329, "dur": 0.067, + "args": { + "External id": 451871,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9486 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352618.645, "dur": 0.055, + "args": { + "External id": 451872,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9487 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352619.493, "dur": 0.070, + "args": { + "External id": 451873,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9488 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352619.811, "dur": 0.051, + "args": { + "External id": 451874,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9489 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352620.696, "dur": 0.068, + "args": { + "External id": 451875,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9490 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352621.016, "dur": 0.261, + "args": { + "External id": 451876,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9491 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352621.678, "dur": 0.319, + "args": { + "External id": 451877,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9492 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352622.244, "dur": 0.076, + "args": { + "External id": 451878,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9493 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352623.019, "dur": 0.298, + "args": { + "External id": 451879,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9494 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352623.567, "dur": 0.262, + "args": { + "External id": 451880,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9495 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352624.517, "dur": 0.068, + "args": { + "External id": 451881,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9496 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352624.839, "dur": 0.078, + "args": { + "External id": 451882,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9497 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352625.548, "dur": 0.065, + "args": { + "External id": 451883,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9498 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352625.860, "dur": 0.075, + "args": { + "External id": 451884,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9499 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352626.662, "dur": 0.273, + "args": { + "External id": 451885,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9500 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352627.183, "dur": 0.094, + "args": { + "External id": 451886,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9501 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352627.938, "dur": 0.069, + "args": { + "External id": 451887,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9502 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352628.522, "dur": 0.051, + "args": { + "External id": 451888,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9503 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352629.062, "dur": 0.071, + "args": { + "External id": 451889,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9504 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352629.381, "dur": 0.055, + "args": { + "External id": 451890,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9505 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352629.890, "dur": 0.074, + "args": { + "External id": 451891,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9506 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352630.213, "dur": 0.052, + "args": { + "External id": 451892,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9507 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352630.743, "dur": 0.067, + "args": { + "External id": 451893,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9508 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352631.057, "dur": 0.056, + "args": { + "External id": 451894,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9509 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352631.967, "dur": 0.065, + "args": { + "External id": 451895,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9510 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352632.282, "dur": 0.051, + "args": { + "External id": 451896,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9511 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352632.924, "dur": 0.067, + "args": { + "External id": 451897,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9512 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352633.243, "dur": 0.049, + "args": { + "External id": 451898,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9513 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352633.944, "dur": 0.070, + "args": { + "External id": 451899,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9514 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352634.261, "dur": 0.049, + "args": { + "External id": 451900,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9515 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352634.917, "dur": 0.067, + "args": { + "External id": 451901,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9516 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352635.236, "dur": 0.054, + "args": { + "External id": 451902,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9517 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352635.760, "dur": 0.069, + "args": { + "External id": 451903,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9518 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352636.076, "dur": 0.051, + "args": { + "External id": 451904,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9519 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 4183441, "tid": 4183441, + "ts": 676008352636.619, "dur": 0.064, + "args": { + "External id": 451905,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 9520 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 4183441, "tid": 4183441, + "ts": 676008353124.981, "dur": 2689.790, + "args": { + "External id": 451906,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.00026688081229955959", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 9521 + } + }, + { + "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 4183441, "tid": 4183441, + "ts": 676008355440.761, "dur": 248.540, + "args": { + "External id": 451907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.00026688081229955959", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 9522 + } + }, + { + "name": "process_name", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 0, + "args": { + "name": "python3.12" + } + }, + { + "name": "process_labels", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 0, + "args": { + "labels": "CPU" + } + }, + { + "name": "process_sort_index", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 0, + "args": { + "sort_index": 4183441 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 31362, + "args": { + "name": "thread 31362 (pt_autograd_5)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 31362, + "args": { + "sort_index": 31362 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 4183441, + "args": { + "name": "thread 4183441 (python3.12)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 4183441, + "args": { + "sort_index": 4183441 + } + }, + { + "name": "thread_name", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 31362, + "args": { + "name": "thread 31362 (python3.12)" + } + }, + { + "name": "thread_sort_index", "ph": "M", "ts": 676007567592.395, "pid": 4183441, "tid": 31362, + "args": { + "sort_index": 31362 + } + }, + { + "ph": "X", "cat": "Trace", "ts": 676007567525.017, "dur": 788626.339, + "pid": "Spans", "tid": "PyTorch Profiler", + "name": "PyTorch Profiler (0)", + "args": { + "Op count": 0 + } + }, + { + "name": "process_sort_index", "ph": "M", "ts": 676007567525.017, + "pid": "Spans", "tid": 0, + "args": { + "sort_index": 536870912 + } + }, + { + "name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", + "pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 676007567525.017 + }, + { + "name": "Record Window End", "ph": "i", "s": "g", + "pid": "", "tid": "", "ts": 676008404722.254 + } + ], + "traceName": "exp/mtp.340M.batch16.seqlen4096.context4096.warmup1000.update1.steps100000.lr3e-4.cosine/profile_trace/iteration_23552/rank5_trace.json", + "displayTimeUnit": "ms", + "baseTimeNanoseconds": 1751410836000000000 +} \ No newline at end of file